{ "best_global_step": 2900, "best_metric": 0.5787694388100068, "best_model_checkpoint": "./bert-philosophy-classifier/checkpoint-2000", "epoch": 11.971830985915492, "eval_steps": 100, "global_step": 3400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "step": 0, "train/classification_loss": 0.6910466551780701, "train/contrastive_loss": 8.255268096923828, "train/negative_loss": 8.255146026611328, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.00012198019248899072, "train/total_loss": 2.3421003818511963 }, { "epoch": 0, "step": 0, "train/classification_loss": 0.6955318450927734, "train/contrastive_loss": 8.37961196899414, "train/negative_loss": 8.379453659057617, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.00015867262845858932, "train/total_loss": 2.3714542388916016 }, { "epoch": 0.176056338028169, "grad_norm": 16.515756607055664, "learning_rate": 9.4e-06, "loss": 3.5924, "step": 50 }, { "epoch": 0.176056338028169, "step": 50, "train/classification_loss": 0.6504760384559631, "train/contrastive_loss": 2.0566799640655518, "train/negative_loss": 2.038007974624634, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.01867193542420864, "train/total_loss": 1.0618120431900024 }, { "epoch": 0.176056338028169, "step": 50, "train/classification_loss": 0.6553352475166321, "train/contrastive_loss": 2.5260558128356934, "train/negative_loss": 2.4801580905914307, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.04589761793613434, "train/total_loss": 1.1605464220046997 }, { "epoch": 0.352112676056338, "grad_norm": 15.680583953857422, "learning_rate": 1.94e-05, "loss": 1.9545, "step": 100 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5292062163352966, "train/contrastive_loss": 2.306614637374878, "train/negative_loss": 2.2695488929748535, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.037065789103507996, "train/total_loss": 0.9905291795730591 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5466294288635254, "train/contrastive_loss": 1.9586219787597656, "train/negative_loss": 1.9250495433807373, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.033572472631931305, "train/total_loss": 0.9383538365364075 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5346500873565674, "train/contrastive_loss": 1.781119704246521, "train/negative_loss": 1.5406951904296875, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.24042446911334991, "train/total_loss": 0.8908740282058716 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5251791477203369, "train/contrastive_loss": 3.1425154209136963, "train/negative_loss": 2.693556785583496, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4489586651325226, "train/total_loss": 1.1536822319030762 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5305714011192322, "train/contrastive_loss": 3.5068647861480713, "train/negative_loss": 3.474233388900757, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.03263139724731445, "train/total_loss": 1.2319443225860596 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5261136889457703, "train/contrastive_loss": 2.0268311500549316, "train/negative_loss": 1.752275824546814, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.2745553255081177, "train/total_loss": 0.9314799308776855 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5449552536010742, "train/contrastive_loss": 1.596300721168518, "train/negative_loss": 1.2735298871994019, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.3227708041667938, "train/total_loss": 0.8642153739929199 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5408021211624146, "train/contrastive_loss": 1.4297927618026733, "train/negative_loss": 1.4292274713516235, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0005652713589370251, "train/total_loss": 0.8267606496810913 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.546276867389679, "train/contrastive_loss": 1.0722688436508179, "train/negative_loss": 1.0496809482574463, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.022587856277823448, "train/total_loss": 0.7607306241989136 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5323413610458374, "train/contrastive_loss": 2.9199142456054688, "train/negative_loss": 1.6162124872207642, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.3037017583847046, "train/total_loss": 1.1163241863250732 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5450893044471741, "train/contrastive_loss": 2.1610963344573975, "train/negative_loss": 2.000896453857422, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.1601998507976532, "train/total_loss": 0.9773085713386536 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5373836755752563, "train/contrastive_loss": 1.8006857633590698, "train/negative_loss": 1.7946306467056274, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.006055121775716543, "train/total_loss": 0.8975208401679993 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.523068904876709, "train/contrastive_loss": 3.6596007347106934, "train/negative_loss": 3.1865477561950684, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.47305306792259216, "train/total_loss": 1.2549891471862793 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5393645167350769, "train/contrastive_loss": 2.5353968143463135, "train/negative_loss": 2.22615909576416, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.30923765897750854, "train/total_loss": 1.0464439392089844 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5152075290679932, "train/contrastive_loss": 3.255272626876831, "train/negative_loss": 2.8025577068328857, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.4527149796485901, "train/total_loss": 1.166262149810791 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.532563328742981, "train/contrastive_loss": 2.4751503467559814, "train/negative_loss": 1.9839431047439575, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.49120721220970154, "train/total_loss": 1.0275933742523193 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5331189036369324, "train/contrastive_loss": 2.0612425804138184, "train/negative_loss": 1.8743646144866943, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.1868780106306076, "train/total_loss": 0.9453674554824829 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5387558937072754, "train/contrastive_loss": 3.6453282833099365, "train/negative_loss": 3.446204662322998, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.19912365078926086, "train/total_loss": 1.2678215503692627 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5483106374740601, "train/contrastive_loss": 1.8980530500411987, "train/negative_loss": 1.8654059171676636, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.032647132873535156, "train/total_loss": 0.9279212951660156 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5107576251029968, "train/contrastive_loss": 3.270677328109741, "train/negative_loss": 3.239260673522949, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.03141666576266289, "train/total_loss": 1.1648931503295898 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5458145141601562, "train/contrastive_loss": 1.5782126188278198, "train/negative_loss": 1.5090008974075317, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.0692116767168045, "train/total_loss": 0.8614570498466492 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5230406522750854, "train/contrastive_loss": 2.8396332263946533, "train/negative_loss": 2.7991995811462402, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.04043358564376831, "train/total_loss": 1.0909672975540161 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5388726592063904, "train/contrastive_loss": 2.4029741287231445, "train/negative_loss": 2.341367721557617, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.06160643696784973, "train/total_loss": 1.0194674730300903 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5483464598655701, "train/contrastive_loss": 2.159550905227661, "train/negative_loss": 1.6986929178237915, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.46085792779922485, "train/total_loss": 0.9802566766738892 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5432572960853577, "train/contrastive_loss": 1.7347164154052734, "train/negative_loss": 1.6608059406280518, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0739104300737381, "train/total_loss": 0.8902006149291992 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5226185917854309, "train/contrastive_loss": 2.3534626960754395, "train/negative_loss": 2.00205659866333, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.35140615701675415, "train/total_loss": 0.9933111667633057 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5365185737609863, "train/contrastive_loss": 4.000570297241211, "train/negative_loss": 2.8349084854125977, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 1.1656616926193237, "train/total_loss": 1.3366327285766602 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5436530709266663, "train/contrastive_loss": 2.752227306365967, "train/negative_loss": 2.3868792057037354, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.36534813046455383, "train/total_loss": 1.0940985679626465 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5252662301063538, "train/contrastive_loss": 3.149979591369629, "train/negative_loss": 2.1100027561187744, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0399768352508545, "train/total_loss": 1.1552622318267822 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.53873211145401, "train/contrastive_loss": 2.7749056816101074, "train/negative_loss": 2.756542205810547, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.01836339570581913, "train/total_loss": 1.0937132835388184 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5252187848091125, "train/contrastive_loss": 1.385758876800537, "train/negative_loss": 1.364824652671814, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.020934201776981354, "train/total_loss": 0.802370548248291 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5307956337928772, "train/contrastive_loss": 2.145063638687134, "train/negative_loss": 1.7865453958511353, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.3585182726383209, "train/total_loss": 0.959808349609375 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5319681763648987, "train/contrastive_loss": 2.523132085800171, "train/negative_loss": 2.286376714706421, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.2367553412914276, "train/total_loss": 1.0365946292877197 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5492977499961853, "train/contrastive_loss": 2.4941790103912354, "train/negative_loss": 1.497723937034607, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.9964550733566284, "train/total_loss": 1.0481336116790771 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5363556146621704, "train/contrastive_loss": 1.8118360042572021, "train/negative_loss": 1.7267634868621826, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.08507253974676132, "train/total_loss": 0.8987228274345398 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5309258699417114, "train/contrastive_loss": 2.3783364295959473, "train/negative_loss": 2.352630376815796, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.025705955922603607, "train/total_loss": 1.0065932273864746 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5422551035881042, "train/contrastive_loss": 1.544332504272461, "train/negative_loss": 1.3956546783447266, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.14867788553237915, "train/total_loss": 0.8511216044425964 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5545170903205872, "train/contrastive_loss": 2.345576047897339, "train/negative_loss": 2.2640533447265625, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0815226212143898, "train/total_loss": 1.023632287979126 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5410986542701721, "train/contrastive_loss": 2.3546016216278076, "train/negative_loss": 2.3232460021972656, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.031355615705251694, "train/total_loss": 1.0120189189910889 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5399579405784607, "train/contrastive_loss": 1.6408647298812866, "train/negative_loss": 1.4657557010650635, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.17510902881622314, "train/total_loss": 0.8681309223175049 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5184195637702942, "train/contrastive_loss": 1.8366289138793945, "train/negative_loss": 1.2438676357269287, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.592761218547821, "train/total_loss": 0.8857453465461731 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5257993936538696, "train/contrastive_loss": 3.42195987701416, "train/negative_loss": 2.86478328704834, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5571765303611755, "train/total_loss": 1.2101913690567017 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.544603705406189, "train/contrastive_loss": 2.036705493927002, "train/negative_loss": 1.905866026878357, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.13083946704864502, "train/total_loss": 0.9519448280334473 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5267763733863831, "train/contrastive_loss": 1.8731989860534668, "train/negative_loss": 1.8441189527511597, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.029080014675855637, "train/total_loss": 0.9014161825180054 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5378268957138062, "train/contrastive_loss": 2.221756935119629, "train/negative_loss": 1.9916719198226929, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.23008498549461365, "train/total_loss": 0.9821783304214478 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5418212413787842, "train/contrastive_loss": 4.279918193817139, "train/negative_loss": 3.504610300064087, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.7753080129623413, "train/total_loss": 1.3978049755096436 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5320029854774475, "train/contrastive_loss": 2.450683832168579, "train/negative_loss": 1.5620760917663574, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8886077404022217, "train/total_loss": 1.0221397876739502 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5374838709831238, "train/contrastive_loss": 2.0769155025482178, "train/negative_loss": 1.8300950527191162, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.24682042002677917, "train/total_loss": 0.9528669714927673 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5383163094520569, "train/contrastive_loss": 3.6867856979370117, "train/negative_loss": 3.633483409881592, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.05330224335193634, "train/total_loss": 1.2756733894348145 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5388382077217102, "train/contrastive_loss": 2.449093818664551, "train/negative_loss": 1.6639244556427002, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.785169243812561, "train/total_loss": 1.0286569595336914 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5398443937301636, "train/contrastive_loss": 3.40635085105896, "train/negative_loss": 3.386542320251465, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.019808607175946236, "train/total_loss": 1.2211146354675293 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.541286826133728, "train/contrastive_loss": 2.3181488513946533, "train/negative_loss": 1.805355429649353, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.5127934217453003, "train/total_loss": 1.0049166679382324 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5403976440429688, "train/contrastive_loss": 1.7116339206695557, "train/negative_loss": 1.5584475994110107, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.15318630635738373, "train/total_loss": 0.882724404335022 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5545975565910339, "train/contrastive_loss": 2.685664176940918, "train/negative_loss": 2.6671087741851807, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.01855549030005932, "train/total_loss": 1.0917303562164307 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5304739475250244, "train/contrastive_loss": 1.4997867345809937, "train/negative_loss": 1.4348959922790527, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.06489069759845734, "train/total_loss": 0.830431342124939 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.528757631778717, "train/contrastive_loss": 3.1133694648742676, "train/negative_loss": 3.069612503051758, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.04375695809721947, "train/total_loss": 1.1514315605163574 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5330578684806824, "train/contrastive_loss": 1.3456382751464844, "train/negative_loss": 1.287862777709961, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.05777547508478165, "train/total_loss": 0.8021855354309082 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5354094505310059, "train/contrastive_loss": 2.4783427715301514, "train/negative_loss": 1.6376371383666992, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.8407056331634521, "train/total_loss": 1.0310779809951782 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5385649800300598, "train/contrastive_loss": 2.7976906299591064, "train/negative_loss": 2.7675998210906982, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.03009072318673134, "train/total_loss": 1.0981030464172363 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5312110781669617, "train/contrastive_loss": 1.37204909324646, "train/negative_loss": 1.1857126951217651, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.18633633852005005, "train/total_loss": 0.8056209087371826 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5352913737297058, "train/contrastive_loss": 2.8081698417663574, "train/negative_loss": 2.6742031574249268, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.1339666098356247, "train/total_loss": 1.0969253778457642 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5294104218482971, "train/contrastive_loss": 2.1925151348114014, "train/negative_loss": 2.1897799968719482, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.0027350601740181446, "train/total_loss": 0.9679134488105774 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5238025784492493, "train/contrastive_loss": 2.6010711193084717, "train/negative_loss": 2.353334426879883, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.24773679673671722, "train/total_loss": 1.0440168380737305 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5400266051292419, "train/contrastive_loss": 2.8627476692199707, "train/negative_loss": 2.7112135887145996, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.1515340507030487, "train/total_loss": 1.1125761270523071 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5383491516113281, "train/contrastive_loss": 4.268233299255371, "train/negative_loss": 2.231462001800537, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 2.036771059036255, "train/total_loss": 1.391995906829834 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.532766580581665, "train/contrastive_loss": 2.8463375568389893, "train/negative_loss": 2.8405442237854004, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.005793261807411909, "train/total_loss": 1.102034091949463 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5443864464759827, "train/contrastive_loss": 1.849961757659912, "train/negative_loss": 1.6025692224502563, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.24739256501197815, "train/total_loss": 0.9143787622451782 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.529344916343689, "train/contrastive_loss": 1.9414914846420288, "train/negative_loss": 1.808849573135376, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.1326419562101364, "train/total_loss": 0.9176431894302368 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5177937150001526, "train/contrastive_loss": 2.0468740463256836, "train/negative_loss": 2.005218982696533, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.041655153036117554, "train/total_loss": 0.9271684885025024 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5452139377593994, "train/contrastive_loss": 1.8783801794052124, "train/negative_loss": 1.5115289688110352, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.36685118079185486, "train/total_loss": 0.9208899736404419 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5393397212028503, "train/contrastive_loss": 3.0772385597229004, "train/negative_loss": 2.4198713302612305, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.6573673486709595, "train/total_loss": 1.1547874212265015 }, { "epoch": 0.352112676056338, "eval_exact_match_accuracy": 0.007054673721340388, "eval_hamming_loss": 0.0991804129059031, "eval_loss": 1.0206341743469238, "eval_macro_f1": 0.004705882352941177, "eval_macro_precision": 0.017077798861480076, "eval_macro_recall": 0.00272892662219527, "eval_micro_f1": 0.018480492813141684, "eval_micro_precision": 0.25, "eval_micro_recall": 0.009594882729211088, "eval_runtime": 2.8027, "eval_samples_per_second": 202.303, "eval_steps_per_second": 25.332, "step": 100 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5403586030006409, "train/contrastive_loss": 2.3812899589538574, "train/negative_loss": 1.652747631072998, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.7285423278808594, "train/total_loss": 1.0166165828704834 }, { "epoch": 0.352112676056338, "step": 100, "train/classification_loss": 0.5478186011314392, "train/contrastive_loss": 1.4490203857421875, "train/negative_loss": 1.1485689878463745, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3004514276981354, "train/total_loss": 0.8376226425170898 }, { "epoch": 0.528169014084507, "grad_norm": 18.845754623413086, "learning_rate": 1.9993375616631433e-05, "loss": 1.6374, "step": 150 }, { "epoch": 0.528169014084507, "step": 150, "train/classification_loss": 0.4399445652961731, "train/contrastive_loss": 1.8953174352645874, "train/negative_loss": 1.2232775688171387, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.6720398664474487, "train/total_loss": 0.8190080523490906 }, { "epoch": 0.528169014084507, "step": 150, "train/classification_loss": 0.45203354954719543, "train/contrastive_loss": 2.333707332611084, "train/negative_loss": 1.3233333826065063, "train/num_negatives": 28, "train/num_positives": 20, "train/positive_loss": 1.0103740692138672, "train/total_loss": 0.9187750220298767 }, { "epoch": 0.704225352112676, "grad_norm": 22.89767837524414, "learning_rate": 1.998632840028189e-05, "loss": 1.4947, "step": 200 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35212618112564087, "train/contrastive_loss": 2.679692268371582, "train/negative_loss": 2.5468082427978516, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.13288407027721405, "train/total_loss": 0.8880646228790283 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.40419623255729675, "train/contrastive_loss": 2.1445202827453613, "train/negative_loss": 2.1230874061584473, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.02143275737762451, "train/total_loss": 0.8331003189086914 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.36665281653404236, "train/contrastive_loss": 3.2175021171569824, "train/negative_loss": 2.35038685798645, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.8671151995658875, "train/total_loss": 1.0101532936096191 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3220570683479309, "train/contrastive_loss": 3.860135793685913, "train/negative_loss": 3.6707465648651123, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.18938927352428436, "train/total_loss": 1.0940842628479004 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.34903034567832947, "train/contrastive_loss": 4.295506000518799, "train/negative_loss": 4.278042316436768, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.01746382936835289, "train/total_loss": 1.2081315517425537 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3510552644729614, "train/contrastive_loss": 2.4234988689422607, "train/negative_loss": 2.118229389190674, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.3052694797515869, "train/total_loss": 0.8357550501823425 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3522025942802429, "train/contrastive_loss": 2.070845603942871, "train/negative_loss": 1.6335164308547974, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.4373290538787842, "train/total_loss": 0.7663717269897461 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3764512538909912, "train/contrastive_loss": 1.995721697807312, "train/negative_loss": 1.995355486869812, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0003661587543319911, "train/total_loss": 0.7755956053733826 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3572298586368561, "train/contrastive_loss": 1.0032556056976318, "train/negative_loss": 0.9694838523864746, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.033771805465221405, "train/total_loss": 0.5578809976577759 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3626837134361267, "train/contrastive_loss": 3.458970546722412, "train/negative_loss": 2.631351947784424, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8276186585426331, "train/total_loss": 1.0544778108596802 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3533361256122589, "train/contrastive_loss": 1.8334563970565796, "train/negative_loss": 1.7719533443450928, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.06150306761264801, "train/total_loss": 0.7200274467468262 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3600704073905945, "train/contrastive_loss": 3.0222949981689453, "train/negative_loss": 2.7934417724609375, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.22885310649871826, "train/total_loss": 0.9645293951034546 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35269612073898315, "train/contrastive_loss": 5.173518657684326, "train/negative_loss": 4.742369174957275, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4311496615409851, "train/total_loss": 1.3873999118804932 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.38129597902297974, "train/contrastive_loss": 2.7656726837158203, "train/negative_loss": 2.366760730743408, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.39891207218170166, "train/total_loss": 0.9344305396080017 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3092501163482666, "train/contrastive_loss": 2.5747292041778564, "train/negative_loss": 2.5314383506774902, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.043290793895721436, "train/total_loss": 0.8241959810256958 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3573189377784729, "train/contrastive_loss": 2.508971929550171, "train/negative_loss": 2.380729913711548, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.1282421052455902, "train/total_loss": 0.859113335609436 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.34687700867652893, "train/contrastive_loss": 2.098405599594116, "train/negative_loss": 2.051146984100342, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.047258712351322174, "train/total_loss": 0.7665581703186035 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35372182726860046, "train/contrastive_loss": 3.717986583709717, "train/negative_loss": 3.0732946395874023, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.6446920037269592, "train/total_loss": 1.0973191261291504 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3786483705043793, "train/contrastive_loss": 2.3159143924713135, "train/negative_loss": 2.2949910163879395, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.020923269912600517, "train/total_loss": 0.8418312668800354 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3270884156227112, "train/contrastive_loss": 3.726046323776245, "train/negative_loss": 3.722228527069092, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.00381774315610528, "train/total_loss": 1.0722976922988892 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3455738127231598, "train/contrastive_loss": 1.8412854671478271, "train/negative_loss": 1.7668914794921875, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.07439402490854263, "train/total_loss": 0.7138309478759766 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.32592976093292236, "train/contrastive_loss": 2.967134952545166, "train/negative_loss": 2.961982488632202, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.005152459722012281, "train/total_loss": 0.9193567633628845 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.36154529452323914, "train/contrastive_loss": 2.2759153842926025, "train/negative_loss": 2.2604081630706787, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.01550716906785965, "train/total_loss": 0.8167283535003662 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3743017017841339, "train/contrastive_loss": 2.1762869358062744, "train/negative_loss": 1.659332513809204, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5169544219970703, "train/total_loss": 0.8095591068267822 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3658154010772705, "train/contrastive_loss": 1.7418978214263916, "train/negative_loss": 1.726149320602417, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.015748459845781326, "train/total_loss": 0.7141950130462646 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.34862056374549866, "train/contrastive_loss": 3.6049418449401855, "train/negative_loss": 2.9295573234558105, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6753845810890198, "train/total_loss": 1.0696089267730713 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.362020343542099, "train/contrastive_loss": 3.104332208633423, "train/negative_loss": 3.068046808242798, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.03628542274236679, "train/total_loss": 0.982886791229248 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3686039447784424, "train/contrastive_loss": 2.305522918701172, "train/negative_loss": 2.166105270385742, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.13941775262355804, "train/total_loss": 0.8297085762023926 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3441305160522461, "train/contrastive_loss": 3.7442047595977783, "train/negative_loss": 3.075505495071411, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.6686992049217224, "train/total_loss": 1.0929715633392334 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3799186050891876, "train/contrastive_loss": 2.24226713180542, "train/negative_loss": 1.9748241901397705, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.2674430012702942, "train/total_loss": 0.8283720016479492 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3319740891456604, "train/contrastive_loss": 2.5897202491760254, "train/negative_loss": 2.5885169506073, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0012032873928546906, "train/total_loss": 0.8499181270599365 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.34652575850486755, "train/contrastive_loss": 3.9046382904052734, "train/negative_loss": 3.165811538696289, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7388266921043396, "train/total_loss": 1.1274534463882446 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3571394085884094, "train/contrastive_loss": 3.291074514389038, "train/negative_loss": 3.213367223739624, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.07770735025405884, "train/total_loss": 1.0153543949127197 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.37590229511260986, "train/contrastive_loss": 2.5141170024871826, "train/negative_loss": 2.1928822994232178, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.3212346136569977, "train/total_loss": 0.8787257075309753 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.38263601064682007, "train/contrastive_loss": 2.3549444675445557, "train/negative_loss": 2.1411330699920654, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.21381144225597382, "train/total_loss": 0.8536249399185181 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3225128948688507, "train/contrastive_loss": 2.863142728805542, "train/negative_loss": 2.797741651535034, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.06540101021528244, "train/total_loss": 0.8951414823532104 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3632167875766754, "train/contrastive_loss": 2.3178040981292725, "train/negative_loss": 2.260415554046631, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.05738852918148041, "train/total_loss": 0.8267775774002075 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.40489381551742554, "train/contrastive_loss": 3.3704092502593994, "train/negative_loss": 3.349266529083252, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.02114260569214821, "train/total_loss": 1.0789756774902344 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3605867326259613, "train/contrastive_loss": 1.298163890838623, "train/negative_loss": 1.2663718461990356, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.03179203346371651, "train/total_loss": 0.6202195286750793 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.36784157156944275, "train/contrastive_loss": 2.1754696369171143, "train/negative_loss": 2.11150860786438, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.0639609694480896, "train/total_loss": 0.8029354810714722 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.324373334646225, "train/contrastive_loss": 1.6347603797912598, "train/negative_loss": 1.5759810209274292, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.05877934768795967, "train/total_loss": 0.6513254046440125 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3359071612358093, "train/contrastive_loss": 3.9236061573028564, "train/negative_loss": 3.7024834156036377, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.22112280130386353, "train/total_loss": 1.1206283569335938 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.38063234090805054, "train/contrastive_loss": 1.5380961894989014, "train/negative_loss": 1.5096781253814697, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.02841809019446373, "train/total_loss": 0.6882516145706177 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35039278864860535, "train/contrastive_loss": 2.1888599395751953, "train/negative_loss": 2.157989263534546, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.03087073564529419, "train/total_loss": 0.7881647944450378 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3656606674194336, "train/contrastive_loss": 2.470716714859009, "train/negative_loss": 2.41229248046875, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.05842426419258118, "train/total_loss": 0.8598040342330933 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.38602688908576965, "train/contrastive_loss": 3.937988758087158, "train/negative_loss": 3.6602749824523926, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.2777137756347656, "train/total_loss": 1.1736246347427368 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3479618430137634, "train/contrastive_loss": 3.955038547515869, "train/negative_loss": 2.2126057147979736, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.7424328327178955, "train/total_loss": 1.1389695405960083 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35680314898490906, "train/contrastive_loss": 2.5151901245117188, "train/negative_loss": 2.3891406059265137, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.12604950368404388, "train/total_loss": 0.8598412275314331 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.37067681550979614, "train/contrastive_loss": 3.4200215339660645, "train/negative_loss": 3.37809419631958, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.04192742332816124, "train/total_loss": 1.0546810626983643 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3493765592575073, "train/contrastive_loss": 2.4909698963165283, "train/negative_loss": 2.1821136474609375, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3088562786579132, "train/total_loss": 0.847570538520813 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.37985509634017944, "train/contrastive_loss": 2.908679962158203, "train/negative_loss": 2.8500924110412598, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.058587461709976196, "train/total_loss": 0.9615911245346069 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.37945207953453064, "train/contrastive_loss": 2.2139487266540527, "train/negative_loss": 2.086418867111206, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.1275298297405243, "train/total_loss": 0.8222418427467346 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3666813373565674, "train/contrastive_loss": 1.779737949371338, "train/negative_loss": 1.7209254503250122, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.058812472969293594, "train/total_loss": 0.7226289510726929 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.4065815210342407, "train/contrastive_loss": 3.4165267944335938, "train/negative_loss": 3.373825788497925, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.04270093888044357, "train/total_loss": 1.0898869037628174 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.33919551968574524, "train/contrastive_loss": 2.654151439666748, "train/negative_loss": 2.6463871002197266, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.007764222100377083, "train/total_loss": 0.8700258731842041 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.33839792013168335, "train/contrastive_loss": 2.9100310802459717, "train/negative_loss": 2.9021646976470947, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.007866277359426022, "train/total_loss": 0.9204041361808777 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3517836332321167, "train/contrastive_loss": 2.234933614730835, "train/negative_loss": 2.2329797744750977, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.0019538896158337593, "train/total_loss": 0.7987703680992126 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.36322763562202454, "train/contrastive_loss": 4.510669708251953, "train/negative_loss": 2.5318989753723145, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.9787707328796387, "train/total_loss": 1.2653615474700928 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.36761924624443054, "train/contrastive_loss": 2.8496103286743164, "train/negative_loss": 2.7521278858184814, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.09748252481222153, "train/total_loss": 0.9375413656234741 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.350806325674057, "train/contrastive_loss": 1.2713918685913086, "train/negative_loss": 1.189595341682434, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.08179657906293869, "train/total_loss": 0.6050847172737122 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35948753356933594, "train/contrastive_loss": 3.549363851547241, "train/negative_loss": 3.200535535812378, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.34882837533950806, "train/total_loss": 1.0693602561950684 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3650091290473938, "train/contrastive_loss": 3.3538875579833984, "train/negative_loss": 3.3494699001312256, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.00441768579185009, "train/total_loss": 1.0357866287231445 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3346955478191376, "train/contrastive_loss": 3.4461872577667236, "train/negative_loss": 3.434870481491089, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.01131683774292469, "train/total_loss": 1.0239330530166626 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.35658740997314453, "train/contrastive_loss": 3.258201837539673, "train/negative_loss": 3.1837801933288574, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.07442161440849304, "train/total_loss": 1.008227825164795 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3788551390171051, "train/contrastive_loss": 4.408748626708984, "train/negative_loss": 2.54168963432312, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.8670587539672852, "train/total_loss": 1.2606048583984375 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3525297939777374, "train/contrastive_loss": 3.835818290710449, "train/negative_loss": 3.8349013328552246, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0009169792756438255, "train/total_loss": 1.1196935176849365 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3724968135356903, "train/contrastive_loss": 1.8083879947662354, "train/negative_loss": 1.6629879474639893, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.14540009200572968, "train/total_loss": 0.7341744303703308 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3550809919834137, "train/contrastive_loss": 2.303849458694458, "train/negative_loss": 2.2234840393066406, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.08036541193723679, "train/total_loss": 0.8158508539199829 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.32960572838783264, "train/contrastive_loss": 3.2862935066223145, "train/negative_loss": 3.2755134105682373, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.010780061595141888, "train/total_loss": 0.986864447593689 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.37115204334259033, "train/contrastive_loss": 2.861098289489746, "train/negative_loss": 2.4897360801696777, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.3713622987270355, "train/total_loss": 0.9433717131614685 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.37576794624328613, "train/contrastive_loss": 2.9777140617370605, "train/negative_loss": 2.5580532550811768, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.4196608364582062, "train/total_loss": 0.9713107943534851 }, { "epoch": 0.704225352112676, "eval_exact_match_accuracy": 0.0, "eval_hamming_loss": 0.09720925407199917, "eval_loss": 0.9205195307731628, "eval_macro_f1": 0.0006033182503770739, "eval_macro_precision": 0.058823529411764705, "eval_macro_recall": 0.00030321406913280777, "eval_micro_f1": 0.002129925452609159, "eval_micro_precision": 1.0, "eval_micro_recall": 0.0010660980810234541, "eval_runtime": 2.8545, "eval_samples_per_second": 198.633, "eval_steps_per_second": 24.873, "step": 200 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3534598648548126, "train/contrastive_loss": 1.6415746212005615, "train/negative_loss": 1.2293429374694824, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.4122316539287567, "train/total_loss": 0.6817747950553894 }, { "epoch": 0.704225352112676, "step": 200, "train/classification_loss": 0.3670371174812317, "train/contrastive_loss": 1.2740015983581543, "train/negative_loss": 0.9414844512939453, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.33251717686653137, "train/total_loss": 0.6218374371528625 }, { "epoch": 0.8802816901408451, "grad_norm": 17.732545852661133, "learning_rate": 1.997928118393235e-05, "loss": 1.3539, "step": 250 }, { "epoch": 0.8802816901408451, "step": 250, "train/classification_loss": 0.3377353549003601, "train/contrastive_loss": 2.0764522552490234, "train/negative_loss": 1.2744636535644531, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8019887208938599, "train/total_loss": 0.7530257701873779 }, { "epoch": 0.8802816901408451, "step": 250, "train/classification_loss": 0.3293566405773163, "train/contrastive_loss": 2.125258445739746, "train/negative_loss": 1.2052654027938843, "train/num_negatives": 30, "train/num_positives": 12, "train/positive_loss": 0.9199931621551514, "train/total_loss": 0.7544083595275879 }, { "epoch": 1.056338028169014, "grad_norm": 20.307628631591797, "learning_rate": 1.9972233967582807e-05, "loss": 1.2688, "step": 300 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.30594518780708313, "train/contrastive_loss": 2.4988250732421875, "train/negative_loss": 2.49473237991333, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.004092785529792309, "train/total_loss": 0.8057101964950562 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.36961638927459717, "train/contrastive_loss": 2.229480028152466, "train/negative_loss": 2.1767866611480713, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.05269325524568558, "train/total_loss": 0.8155124187469482 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31562164425849915, "train/contrastive_loss": 3.3603179454803467, "train/negative_loss": 2.18591570854187, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.1744022369384766, "train/total_loss": 0.9876852035522461 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.260353684425354, "train/contrastive_loss": 2.384992837905884, "train/negative_loss": 2.353367567062378, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.03162530064582825, "train/total_loss": 0.7373522520065308 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.29958847165107727, "train/contrastive_loss": 3.18422269821167, "train/negative_loss": 3.019544839859009, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.1646779477596283, "train/total_loss": 0.9364330768585205 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.30007806420326233, "train/contrastive_loss": 3.0554862022399902, "train/negative_loss": 2.2332777976989746, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8222082853317261, "train/total_loss": 0.9111753702163696 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.29807448387145996, "train/contrastive_loss": 2.0360546112060547, "train/negative_loss": 1.878265380859375, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.15778911113739014, "train/total_loss": 0.7052854299545288 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.33394795656204224, "train/contrastive_loss": 1.64840829372406, "train/negative_loss": 1.6481661796569824, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00024208375543821603, "train/total_loss": 0.6636296510696411 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31289201974868774, "train/contrastive_loss": 1.3649917840957642, "train/negative_loss": 1.2146955728530884, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.1502961814403534, "train/total_loss": 0.5858904123306274 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31317582726478577, "train/contrastive_loss": 3.554135799407959, "train/negative_loss": 2.103843927383423, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.4502917528152466, "train/total_loss": 1.024003028869629 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2947699725627899, "train/contrastive_loss": 2.4679057598114014, "train/negative_loss": 2.399268865585327, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.06863680481910706, "train/total_loss": 0.7883511185646057 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31243011355400085, "train/contrastive_loss": 1.931992530822754, "train/negative_loss": 1.9139418601989746, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.018050648272037506, "train/total_loss": 0.6988286375999451 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.29993221163749695, "train/contrastive_loss": 5.04127836227417, "train/negative_loss": 3.258833646774292, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.7824445962905884, "train/total_loss": 1.3081879615783691 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3398338258266449, "train/contrastive_loss": 4.088870048522949, "train/negative_loss": 1.8648176193237305, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 2.224052667617798, "train/total_loss": 1.1576077938079834 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.24651873111724854, "train/contrastive_loss": 2.714564085006714, "train/negative_loss": 2.345625638961792, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.3689383864402771, "train/total_loss": 0.7894315719604492 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3147347569465637, "train/contrastive_loss": 3.5181074142456055, "train/negative_loss": 2.768947124481201, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.7491604089736938, "train/total_loss": 1.0183563232421875 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2947418987751007, "train/contrastive_loss": 2.9206302165985107, "train/negative_loss": 2.7699949741363525, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.15063515305519104, "train/total_loss": 0.8788679838180542 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3061610758304596, "train/contrastive_loss": 3.530163288116455, "train/negative_loss": 3.253753185272217, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.27641019225120544, "train/total_loss": 1.0121937990188599 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3312360644340515, "train/contrastive_loss": 1.7040787935256958, "train/negative_loss": 1.6804348230361938, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.02364397421479225, "train/total_loss": 0.6720517873764038 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.26763319969177246, "train/contrastive_loss": 2.2348668575286865, "train/negative_loss": 2.1961047649383545, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.03876205533742905, "train/total_loss": 0.7146065831184387 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.28071412444114685, "train/contrastive_loss": 1.3188576698303223, "train/negative_loss": 1.1333078145980835, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.185549795627594, "train/total_loss": 0.5444856882095337 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2643817067146301, "train/contrastive_loss": 3.064574718475342, "train/negative_loss": 2.9858994483947754, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.07867515087127686, "train/total_loss": 0.8772966861724854 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3155921697616577, "train/contrastive_loss": 2.911530017852783, "train/negative_loss": 1.8282358646392822, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.0832940340042114, "train/total_loss": 0.8978981971740723 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.33588844537734985, "train/contrastive_loss": 2.692957639694214, "train/negative_loss": 1.6892998218536377, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.0036578178405762, "train/total_loss": 0.8744800090789795 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3198592960834503, "train/contrastive_loss": 2.034044027328491, "train/negative_loss": 1.768754243850708, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.26528987288475037, "train/total_loss": 0.726668119430542 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.29373568296432495, "train/contrastive_loss": 3.501856803894043, "train/negative_loss": 2.3817152976989746, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1201415061950684, "train/total_loss": 0.9941070675849915 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31500720977783203, "train/contrastive_loss": 2.423717498779297, "train/negative_loss": 2.421290636062622, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0024269737768918276, "train/total_loss": 0.7997506856918335 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3181622326374054, "train/contrastive_loss": 1.0337097644805908, "train/negative_loss": 1.0289721488952637, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.004737657494843006, "train/total_loss": 0.524904191493988 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2979702651500702, "train/contrastive_loss": 3.610692024230957, "train/negative_loss": 1.9066754579544067, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.7040166854858398, "train/total_loss": 1.020108699798584 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3428727984428406, "train/contrastive_loss": 1.9881088733673096, "train/negative_loss": 1.655469536781311, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.3326393663883209, "train/total_loss": 0.7404946088790894 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2712554633617401, "train/contrastive_loss": 2.010617256164551, "train/negative_loss": 2.006277561187744, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.004339645616710186, "train/total_loss": 0.6733789443969727 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2919139266014099, "train/contrastive_loss": 4.656617641448975, "train/negative_loss": 3.2068932056427, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.449724555015564, "train/total_loss": 1.2232375144958496 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3088808059692383, "train/contrastive_loss": 3.0035738945007324, "train/negative_loss": 2.2147040367126465, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7888697385787964, "train/total_loss": 0.9095956087112427 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3173966109752655, "train/contrastive_loss": 2.497237205505371, "train/negative_loss": 1.6290912628173828, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.8681459426879883, "train/total_loss": 0.8168440461158752 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.33909109234809875, "train/contrastive_loss": 3.077838897705078, "train/negative_loss": 2.4171860218048096, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6606528162956238, "train/total_loss": 0.9546588659286499 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.26384925842285156, "train/contrastive_loss": 3.8524835109710693, "train/negative_loss": 3.6561694145202637, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.1963140368461609, "train/total_loss": 1.0343459844589233 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3107200562953949, "train/contrastive_loss": 2.201188087463379, "train/negative_loss": 1.7593269348144531, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.4418611526489258, "train/total_loss": 0.7509576678276062 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3748219311237335, "train/contrastive_loss": 4.88300085067749, "train/negative_loss": 4.8675031661987305, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.015497865155339241, "train/total_loss": 1.3514220714569092 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3118785619735718, "train/contrastive_loss": 1.8053268194198608, "train/negative_loss": 1.709904670715332, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0954221561551094, "train/total_loss": 0.6729439496994019 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.32360708713531494, "train/contrastive_loss": 3.670279026031494, "train/negative_loss": 3.0591373443603516, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.611141562461853, "train/total_loss": 1.0576629638671875 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.26719018816947937, "train/contrastive_loss": 1.7779717445373535, "train/negative_loss": 1.552098035812378, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.22587375342845917, "train/total_loss": 0.6227845549583435 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.27464035153388977, "train/contrastive_loss": 4.823848724365234, "train/negative_loss": 4.2317962646484375, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5920522809028625, "train/total_loss": 1.239410161972046 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3322891294956207, "train/contrastive_loss": 2.0012426376342773, "train/negative_loss": 1.9953967332839966, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.005845996551215649, "train/total_loss": 0.7325376272201538 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3042404353618622, "train/contrastive_loss": 3.341874122619629, "train/negative_loss": 3.3319761753082275, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.009897973388433456, "train/total_loss": 0.9726152420043945 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3163105547428131, "train/contrastive_loss": 2.1025753021240234, "train/negative_loss": 1.6227657794952393, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.47980961203575134, "train/total_loss": 0.7368255853652954 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.35113173723220825, "train/contrastive_loss": 3.732910633087158, "train/negative_loss": 3.2763113975524902, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.45659929513931274, "train/total_loss": 1.0977139472961426 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.28845012187957764, "train/contrastive_loss": 2.3967533111572266, "train/negative_loss": 1.6205039024353027, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7762492895126343, "train/total_loss": 0.7678008079528809 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.311286598443985, "train/contrastive_loss": 2.243960380554199, "train/negative_loss": 1.697359561920166, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5466007590293884, "train/total_loss": 0.7600786685943604 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.329230934381485, "train/contrastive_loss": 2.6925671100616455, "train/negative_loss": 2.6917529106140137, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.0008141135331243277, "train/total_loss": 0.8677443265914917 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2909841537475586, "train/contrastive_loss": 2.3947298526763916, "train/negative_loss": 1.6677296161651611, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.7270002365112305, "train/total_loss": 0.7699301242828369 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3502001464366913, "train/contrastive_loss": 3.011383056640625, "train/negative_loss": 2.275353193283081, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.736029863357544, "train/total_loss": 0.9524767398834229 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3382168710231781, "train/contrastive_loss": 1.9932276010513306, "train/negative_loss": 1.863538384437561, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.12968920171260834, "train/total_loss": 0.7368624210357666 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31939324736595154, "train/contrastive_loss": 1.3574552536010742, "train/negative_loss": 1.290783166885376, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.06667205691337585, "train/total_loss": 0.5908843278884888 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.37328213453292847, "train/contrastive_loss": 2.9023702144622803, "train/negative_loss": 2.844270706176758, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.05809956043958664, "train/total_loss": 0.9537562131881714 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.284429669380188, "train/contrastive_loss": 2.50447678565979, "train/negative_loss": 2.5031793117523193, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.0012975239660590887, "train/total_loss": 0.7853250503540039 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.28343111276626587, "train/contrastive_loss": 2.2238190174102783, "train/negative_loss": 2.1554484367370605, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.06837065517902374, "train/total_loss": 0.7281949520111084 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3072069585323334, "train/contrastive_loss": 2.5616800785064697, "train/negative_loss": 2.141780138015747, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.41989991068840027, "train/total_loss": 0.8195430040359497 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3118622303009033, "train/contrastive_loss": 4.651161193847656, "train/negative_loss": 3.265319585800171, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.385841727256775, "train/total_loss": 1.2420945167541504 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31704023480415344, "train/contrastive_loss": 2.5177791118621826, "train/negative_loss": 2.467808485031128, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.049970537424087524, "train/total_loss": 0.8205960988998413 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2948223352432251, "train/contrastive_loss": 0.7317419648170471, "train/negative_loss": 0.5935785174369812, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.13816343247890472, "train/total_loss": 0.44117075204849243 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3094301223754883, "train/contrastive_loss": 2.8702237606048584, "train/negative_loss": 2.7152650356292725, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.15495876967906952, "train/total_loss": 0.8834748864173889 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3186941146850586, "train/contrastive_loss": 3.375020980834961, "train/negative_loss": 3.3734092712402344, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.0016116963233798742, "train/total_loss": 0.9936982989311218 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2759850323200226, "train/contrastive_loss": 2.366849899291992, "train/negative_loss": 2.1227517127990723, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2440982311964035, "train/total_loss": 0.7493550181388855 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.30546504259109497, "train/contrastive_loss": 3.506561279296875, "train/negative_loss": 3.472888946533203, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.03367223963141441, "train/total_loss": 1.006777286529541 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.33961692452430725, "train/contrastive_loss": 3.1121997833251953, "train/negative_loss": 2.3136544227600098, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.798545241355896, "train/total_loss": 0.9620568752288818 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2976114749908447, "train/contrastive_loss": 4.00618839263916, "train/negative_loss": 4.005701541900635, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0004868100513704121, "train/total_loss": 1.0988491773605347 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3231847584247589, "train/contrastive_loss": 1.5908297300338745, "train/negative_loss": 1.5669194459915161, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.02391027845442295, "train/total_loss": 0.6413507461547852 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.31038302183151245, "train/contrastive_loss": 2.4374196529388428, "train/negative_loss": 2.419769048690796, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.017650671303272247, "train/total_loss": 0.797866940498352 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2667391896247864, "train/contrastive_loss": 2.343015193939209, "train/negative_loss": 2.3206093311309814, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.022405769675970078, "train/total_loss": 0.735342264175415 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.32684218883514404, "train/contrastive_loss": 1.964792013168335, "train/negative_loss": 1.7444849014282227, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.22030705213546753, "train/total_loss": 0.719800591468811 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3296954929828644, "train/contrastive_loss": 3.6302342414855957, "train/negative_loss": 2.858065128326416, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.7721689939498901, "train/total_loss": 1.0557423830032349 }, { "epoch": 1.056338028169014, "eval_exact_match_accuracy": 0.0, "eval_hamming_loss": 0.09720925407199917, "eval_loss": 0.8579484224319458, "eval_macro_f1": 0.0006033182503770739, "eval_macro_precision": 0.058823529411764705, "eval_macro_recall": 0.00030321406913280777, "eval_micro_f1": 0.002129925452609159, "eval_micro_precision": 1.0, "eval_micro_recall": 0.0010660980810234541, "eval_runtime": 2.8413, "eval_samples_per_second": 199.558, "eval_steps_per_second": 24.989, "step": 300 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.2964499294757843, "train/contrastive_loss": 2.260348320007324, "train/negative_loss": 1.5223454236984253, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.7380029559135437, "train/total_loss": 0.7485195994377136 }, { "epoch": 1.056338028169014, "step": 300, "train/classification_loss": 0.3303905427455902, "train/contrastive_loss": 2.6616411209106445, "train/negative_loss": 1.471295952796936, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.190345048904419, "train/total_loss": 0.8627188205718994 }, { "epoch": 1.232394366197183, "grad_norm": 22.85978889465332, "learning_rate": 1.9965186751233265e-05, "loss": 1.2471, "step": 350 }, { "epoch": 1.232394366197183, "step": 350, "train/classification_loss": 0.2880552113056183, "train/contrastive_loss": 1.1895866394042969, "train/negative_loss": 1.1130249500274658, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.07656171917915344, "train/total_loss": 0.5259725451469421 }, { "epoch": 1.232394366197183, "step": 350, "train/classification_loss": 0.26903045177459717, "train/contrastive_loss": 1.6373264789581299, "train/negative_loss": 0.9257901310920715, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.7115364074707031, "train/total_loss": 0.5964957475662231 }, { "epoch": 1.408450704225352, "grad_norm": 21.00748062133789, "learning_rate": 1.9958139534883723e-05, "loss": 1.2271, "step": 400 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.28314051032066345, "train/contrastive_loss": 3.6485836505889893, "train/negative_loss": 3.6469433307647705, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.0016404222697019577, "train/total_loss": 1.01285719871521 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.35745859146118164, "train/contrastive_loss": 1.6834310293197632, "train/negative_loss": 1.6269944906234741, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.05643654987215996, "train/total_loss": 0.6941448450088501 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3006758391857147, "train/contrastive_loss": 4.145646572113037, "train/negative_loss": 2.6357791423797607, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.509867548942566, "train/total_loss": 1.1298052072525024 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.22981052100658417, "train/contrastive_loss": 2.5373754501342773, "train/negative_loss": 2.4768316745758057, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.060543760657310486, "train/total_loss": 0.7372856140136719 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2808890640735626, "train/contrastive_loss": 3.290686845779419, "train/negative_loss": 3.189662218093872, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.1010245680809021, "train/total_loss": 0.9390264749526978 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2821494936943054, "train/contrastive_loss": 3.2997570037841797, "train/negative_loss": 2.7153472900390625, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.5844097137451172, "train/total_loss": 0.9421008825302124 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2745994031429291, "train/contrastive_loss": 2.316945791244507, "train/negative_loss": 2.0420944690704346, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.27485138177871704, "train/total_loss": 0.7379885911941528 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.31354820728302, "train/contrastive_loss": 2.1877691745758057, "train/negative_loss": 2.187727212905884, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 4.1962550312746316e-05, "train/total_loss": 0.751102089881897 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.27818140387535095, "train/contrastive_loss": 2.015977382659912, "train/negative_loss": 1.615659236907959, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.4003180265426636, "train/total_loss": 0.6813768744468689 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.29782742261886597, "train/contrastive_loss": 3.6882712841033936, "train/negative_loss": 2.3672292232513428, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.3210420608520508, "train/total_loss": 1.0354816913604736 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2708834409713745, "train/contrastive_loss": 1.884966254234314, "train/negative_loss": 1.7773405313491821, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.10762572288513184, "train/total_loss": 0.6478767395019531 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2913475036621094, "train/contrastive_loss": 2.8310608863830566, "train/negative_loss": 2.1860485076904297, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.6450124382972717, "train/total_loss": 0.8575596809387207 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2809962034225464, "train/contrastive_loss": 4.520957946777344, "train/negative_loss": 3.2867579460144043, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.2342002391815186, "train/total_loss": 1.185187816619873 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3250114917755127, "train/contrastive_loss": 6.256960868835449, "train/negative_loss": 2.8978018760681152, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 3.359158992767334, "train/total_loss": 1.5764037370681763 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.21937939524650574, "train/contrastive_loss": 2.758821725845337, "train/negative_loss": 2.2684803009033203, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.4903413653373718, "train/total_loss": 0.7711437940597534 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2930915057659149, "train/contrastive_loss": 3.8704781532287598, "train/negative_loss": 3.289940357208252, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5805377960205078, "train/total_loss": 1.0671871900558472 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2719612121582031, "train/contrastive_loss": 2.343186855316162, "train/negative_loss": 2.2578723430633545, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.0853145644068718, "train/total_loss": 0.7405985593795776 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2838720381259918, "train/contrastive_loss": 4.29950475692749, "train/negative_loss": 2.86482572555542, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.4346790313720703, "train/total_loss": 1.1437729597091675 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3134099245071411, "train/contrastive_loss": 1.483730673789978, "train/negative_loss": 1.449765682220459, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.03396494314074516, "train/total_loss": 0.6101560592651367 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2442343682050705, "train/contrastive_loss": 2.234797954559326, "train/negative_loss": 2.1959829330444336, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.03881501033902168, "train/total_loss": 0.6911939382553101 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.25493910908699036, "train/contrastive_loss": 1.4183422327041626, "train/negative_loss": 1.3800286054611206, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.03831358626484871, "train/total_loss": 0.5386075973510742 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2346188873052597, "train/contrastive_loss": 2.815380811691284, "train/negative_loss": 2.572707176208496, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.24267353117465973, "train/total_loss": 0.7976951003074646 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2991984188556671, "train/contrastive_loss": 4.171680450439453, "train/negative_loss": 1.799856185913086, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 2.371824264526367, "train/total_loss": 1.133534550666809 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3120678663253784, "train/contrastive_loss": 2.901266098022461, "train/negative_loss": 2.0078399181365967, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.8934262990951538, "train/total_loss": 0.8923211097717285 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.29216432571411133, "train/contrastive_loss": 2.6716737747192383, "train/negative_loss": 1.666440486907959, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.0052334070205688, "train/total_loss": 0.8264991044998169 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.27575424313545227, "train/contrastive_loss": 3.7175068855285645, "train/negative_loss": 2.7596592903137207, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9578475952148438, "train/total_loss": 1.0192556381225586 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2976415455341339, "train/contrastive_loss": 2.7999374866485596, "train/negative_loss": 2.7792277336120605, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.020709799602627754, "train/total_loss": 0.8576290607452393 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.29993757605552673, "train/contrastive_loss": 0.8771870732307434, "train/negative_loss": 0.8421351909637451, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.0350518561899662, "train/total_loss": 0.4753749966621399 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.280966192483902, "train/contrastive_loss": 3.608607769012451, "train/negative_loss": 2.94978404045105, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.6588236689567566, "train/total_loss": 1.0026878118515015 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.32713279128074646, "train/contrastive_loss": 1.831444501876831, "train/negative_loss": 1.7606438398361206, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.07080063968896866, "train/total_loss": 0.6934217214584351 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.24486862123012543, "train/contrastive_loss": 1.659805178642273, "train/negative_loss": 1.6573882102966309, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0024170209653675556, "train/total_loss": 0.5768296718597412 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2733094394207001, "train/contrastive_loss": 4.90904426574707, "train/negative_loss": 3.468482494354248, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.4405617713928223, "train/total_loss": 1.2551182508468628 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.28643983602523804, "train/contrastive_loss": 3.4082577228546143, "train/negative_loss": 2.7432756423950195, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.66498202085495, "train/total_loss": 0.9680913686752319 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.29841044545173645, "train/contrastive_loss": 2.4200477600097656, "train/negative_loss": 2.043607473373413, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.37644028663635254, "train/total_loss": 0.7824200391769409 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3234871029853821, "train/contrastive_loss": 4.502335548400879, "train/negative_loss": 3.422264575958252, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.080070972442627, "train/total_loss": 1.223954200744629 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.23264829814434052, "train/contrastive_loss": 3.969658136367798, "train/negative_loss": 3.4609906673431396, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5086674690246582, "train/total_loss": 1.0265799760818481 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2903940677642822, "train/contrastive_loss": 2.3835885524749756, "train/negative_loss": 2.3447093963623047, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.03887925297021866, "train/total_loss": 0.7671117782592773 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.35945478081703186, "train/contrastive_loss": 5.76614236831665, "train/negative_loss": 5.759280204772949, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.006862022913992405, "train/total_loss": 1.5126832723617554 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2925422787666321, "train/contrastive_loss": 1.3959766626358032, "train/negative_loss": 1.1795071363449097, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.21646957099437714, "train/total_loss": 0.5717376470565796 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.30739670991897583, "train/contrastive_loss": 4.221601486206055, "train/negative_loss": 4.039336681365967, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.18226470053195953, "train/total_loss": 1.151716947555542 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.24188092350959778, "train/contrastive_loss": 2.5173935890197754, "train/negative_loss": 2.0494346618652344, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.467958927154541, "train/total_loss": 0.7453596591949463 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.25453948974609375, "train/contrastive_loss": 5.941244125366211, "train/negative_loss": 4.527768611907959, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.4134756326675415, "train/total_loss": 1.4427883625030518 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.31516823172569275, "train/contrastive_loss": 2.153377056121826, "train/negative_loss": 2.133862018585205, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.01951492205262184, "train/total_loss": 0.7458436489105225 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2895812392234802, "train/contrastive_loss": 3.385507345199585, "train/negative_loss": 3.381545305252075, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.003962024115025997, "train/total_loss": 0.9666827321052551 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.29960328340530396, "train/contrastive_loss": 2.3431429862976074, "train/negative_loss": 1.7375675439834595, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.6055755615234375, "train/total_loss": 0.7682318687438965 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.34186220169067383, "train/contrastive_loss": 4.986680507659912, "train/negative_loss": 4.8491291999816895, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.13755129277706146, "train/total_loss": 1.339198350906372 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2666102647781372, "train/contrastive_loss": 4.593352317810059, "train/negative_loss": 2.2988717555999756, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.294480800628662, "train/total_loss": 1.1852807998657227 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.28822842240333557, "train/contrastive_loss": 2.5433995723724365, "train/negative_loss": 2.4596502780914307, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.08374931663274765, "train/total_loss": 0.7969083786010742 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3163786232471466, "train/contrastive_loss": 2.4625463485717773, "train/negative_loss": 2.4441275596618652, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.018418695777654648, "train/total_loss": 0.8088878989219666 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2659255862236023, "train/contrastive_loss": 2.0809900760650635, "train/negative_loss": 1.687066674232483, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3939233124256134, "train/total_loss": 0.682123601436615 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3270394504070282, "train/contrastive_loss": 2.4765117168426514, "train/negative_loss": 2.187736988067627, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.28877466917037964, "train/total_loss": 0.822341799736023 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3214586079120636, "train/contrastive_loss": 2.243574619293213, "train/negative_loss": 2.226280927658081, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.017293790355324745, "train/total_loss": 0.7701735496520996 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2980997860431671, "train/contrastive_loss": 1.4891579151153564, "train/negative_loss": 1.262666940689087, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.22649097442626953, "train/total_loss": 0.5959314107894897 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3622506260871887, "train/contrastive_loss": 3.5721888542175293, "train/negative_loss": 3.4855449199676514, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.08664385974407196, "train/total_loss": 1.0766884088516235 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2531818449497223, "train/contrastive_loss": 2.639148235321045, "train/negative_loss": 2.637859344482422, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.0012888265773653984, "train/total_loss": 0.7810114622116089 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2568850815296173, "train/contrastive_loss": 2.1130855083465576, "train/negative_loss": 1.893040657043457, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.22004477679729462, "train/total_loss": 0.6795021891593933 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.28819215297698975, "train/contrastive_loss": 3.1632916927337646, "train/negative_loss": 3.134622812271118, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.02866896614432335, "train/total_loss": 0.9208505153656006 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.292076051235199, "train/contrastive_loss": 5.979118347167969, "train/negative_loss": 3.3803794384002686, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 2.5987389087677, "train/total_loss": 1.4878997802734375 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2968142628669739, "train/contrastive_loss": 2.799877166748047, "train/negative_loss": 2.6201677322387695, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.17970947921276093, "train/total_loss": 0.8567897081375122 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2720637023448944, "train/contrastive_loss": 1.3613431453704834, "train/negative_loss": 1.1893391609191895, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.17200396955013275, "train/total_loss": 0.5443323254585266 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2867943346500397, "train/contrastive_loss": 2.043962001800537, "train/negative_loss": 1.7115544080734253, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.332407683134079, "train/total_loss": 0.6955867409706116 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.306005597114563, "train/contrastive_loss": 3.86198091506958, "train/negative_loss": 3.858013391494751, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.003967516124248505, "train/total_loss": 1.078401803970337 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2502118945121765, "train/contrastive_loss": 2.805070400238037, "train/negative_loss": 2.1969077587127686, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.6081627607345581, "train/total_loss": 0.8112260103225708 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2816160321235657, "train/contrastive_loss": 3.772751569747925, "train/negative_loss": 3.761920213699341, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.010831433348357677, "train/total_loss": 1.0361664295196533 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3179038166999817, "train/contrastive_loss": 5.492734909057617, "train/negative_loss": 3.0714924335479736, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 2.4212422370910645, "train/total_loss": 1.4164507389068604 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2772493064403534, "train/contrastive_loss": 2.904123306274414, "train/negative_loss": 2.869365930557251, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.034757260233163834, "train/total_loss": 0.8580739498138428 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.30459970235824585, "train/contrastive_loss": 1.9777851104736328, "train/negative_loss": 1.9691665172576904, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.008618637919425964, "train/total_loss": 0.7001566886901855 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2939474880695343, "train/contrastive_loss": 3.134911298751831, "train/negative_loss": 3.0512232780456543, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0836879089474678, "train/total_loss": 0.9209297895431519 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.2405194342136383, "train/contrastive_loss": 2.8466434478759766, "train/negative_loss": 2.642735719680786, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.203907772898674, "train/total_loss": 0.8098481893539429 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.31088942289352417, "train/contrastive_loss": 3.955350875854492, "train/negative_loss": 2.314692735671997, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.6406581401824951, "train/total_loss": 1.1019595861434937 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3126649260520935, "train/contrastive_loss": 3.1432363986968994, "train/negative_loss": 2.495011329650879, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.6482250690460205, "train/total_loss": 0.9413121938705444 }, { "epoch": 1.408450704225352, "eval_exact_match_accuracy": 0.007054673721340388, "eval_hamming_loss": 0.09627554725593941, "eval_loss": 0.9071576595306396, "eval_macro_f1": 0.0057670126874279125, "eval_macro_precision": 0.058823529411764705, "eval_macro_recall": 0.0030321406913280773, "eval_micro_f1": 0.02109704641350211, "eval_micro_precision": 1.0, "eval_micro_recall": 0.010660980810234541, "eval_runtime": 2.8429, "eval_samples_per_second": 199.446, "eval_steps_per_second": 24.975, "step": 400 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.3063514828681946, "train/contrastive_loss": 0.9124388694763184, "train/negative_loss": 0.6337320804595947, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.27870678901672363, "train/total_loss": 0.4888392686843872 }, { "epoch": 1.408450704225352, "step": 400, "train/classification_loss": 0.28292348980903625, "train/contrastive_loss": 1.2839583158493042, "train/negative_loss": 1.1856136322021484, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.09834469854831696, "train/total_loss": 0.5397151708602905 }, { "epoch": 1.584507042253521, "grad_norm": 20.219684600830078, "learning_rate": 1.995123326286117e-05, "loss": 1.1671, "step": 450 }, { "epoch": 1.584507042253521, "step": 450, "train/classification_loss": 0.2751622498035431, "train/contrastive_loss": 1.8498551845550537, "train/negative_loss": 0.8557652235031128, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9940899014472961, "train/total_loss": 0.6451332569122314 }, { "epoch": 1.584507042253521, "step": 450, "train/classification_loss": 0.2665400803089142, "train/contrastive_loss": 2.26444673538208, "train/negative_loss": 1.9925936460494995, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.2718530297279358, "train/total_loss": 0.7194294333457947 }, { "epoch": 1.76056338028169, "grad_norm": 13.850686073303223, "learning_rate": 1.994418604651163e-05, "loss": 1.1877, "step": 500 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2746850550174713, "train/contrastive_loss": 2.372941732406616, "train/negative_loss": 2.345904588699341, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.02703716978430748, "train/total_loss": 0.749273419380188 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3542173504829407, "train/contrastive_loss": 1.5934892892837524, "train/negative_loss": 1.4353690147399902, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.1581203192472458, "train/total_loss": 0.6729152202606201 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2922971546649933, "train/contrastive_loss": 3.7633190155029297, "train/negative_loss": 2.4660730361938477, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.2972458600997925, "train/total_loss": 1.0449609756469727 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.21439695358276367, "train/contrastive_loss": 2.3541316986083984, "train/negative_loss": 1.6336003541946411, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7205313444137573, "train/total_loss": 0.6852233409881592 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2711621820926666, "train/contrastive_loss": 3.327296733856201, "train/negative_loss": 3.0933024883270264, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.2339942753314972, "train/total_loss": 0.9366215467453003 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2754226624965668, "train/contrastive_loss": 3.468142509460449, "train/negative_loss": 2.288297176361084, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.1798453330993652, "train/total_loss": 0.9690511226654053 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2677496671676636, "train/contrastive_loss": 2.6534390449523926, "train/negative_loss": 1.895154356956482, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.7582846283912659, "train/total_loss": 0.7984374761581421 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3002317249774933, "train/contrastive_loss": 1.6155636310577393, "train/negative_loss": 1.6155221462249756, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 4.1485694964649156e-05, "train/total_loss": 0.6233444213867188 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2563718259334564, "train/contrastive_loss": 1.2085214853286743, "train/negative_loss": 1.031713843345642, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.17680767178535461, "train/total_loss": 0.4980761408805847 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2899928689002991, "train/contrastive_loss": 3.2499887943267822, "train/negative_loss": 1.6832780838012695, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.5667107105255127, "train/total_loss": 0.9399906396865845 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2547776401042938, "train/contrastive_loss": 1.6170804500579834, "train/negative_loss": 1.590372085571289, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.026708392426371574, "train/total_loss": 0.578193724155426 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.27819275856018066, "train/contrastive_loss": 2.675546169281006, "train/negative_loss": 1.767678141593933, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.9078681468963623, "train/total_loss": 0.8133019804954529 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2753927409648895, "train/contrastive_loss": 5.103810787200928, "train/negative_loss": 2.7712783813476562, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.3325324058532715, "train/total_loss": 1.2961549758911133 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.31207919120788574, "train/contrastive_loss": 3.9416584968566895, "train/negative_loss": 2.3110086917877197, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.6306499242782593, "train/total_loss": 1.1004109382629395 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2047160267829895, "train/contrastive_loss": 3.0547940731048584, "train/negative_loss": 1.8693389892578125, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.185455083847046, "train/total_loss": 0.8156748414039612 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28234678506851196, "train/contrastive_loss": 2.6560606956481934, "train/negative_loss": 2.1974549293518066, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.4586058557033539, "train/total_loss": 0.8135589361190796 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2614976763725281, "train/contrastive_loss": 1.7249749898910522, "train/negative_loss": 1.6987032890319824, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.02627166360616684, "train/total_loss": 0.6064926385879517 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.272960901260376, "train/contrastive_loss": 2.9053120613098145, "train/negative_loss": 1.705049991607666, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.200262188911438, "train/total_loss": 0.8540233373641968 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.30305367708206177, "train/contrastive_loss": 1.5640089511871338, "train/negative_loss": 1.4782166481018066, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.08579232543706894, "train/total_loss": 0.6158554553985596 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.23551839590072632, "train/contrastive_loss": 2.1996805667877197, "train/negative_loss": 1.8477649688720703, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.35191550850868225, "train/total_loss": 0.6754544973373413 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.23813864588737488, "train/contrastive_loss": 1.5576269626617432, "train/negative_loss": 1.4352878332138062, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.12233909219503403, "train/total_loss": 0.5496640205383301 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2204272598028183, "train/contrastive_loss": 2.505669355392456, "train/negative_loss": 1.9168288707733154, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5888404846191406, "train/total_loss": 0.7215611338615417 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28241947293281555, "train/contrastive_loss": 2.472677230834961, "train/negative_loss": 1.5921576023101807, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.8805195689201355, "train/total_loss": 0.7769548892974854 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2984713912010193, "train/contrastive_loss": 2.957724094390869, "train/negative_loss": 1.658460021018982, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.2992639541625977, "train/total_loss": 0.8900161981582642 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28209152817726135, "train/contrastive_loss": 2.216071605682373, "train/negative_loss": 1.2685127258300781, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.9475589990615845, "train/total_loss": 0.7253058552742004 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.26708120107650757, "train/contrastive_loss": 3.642721176147461, "train/negative_loss": 2.2846689224243164, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3580522537231445, "train/total_loss": 0.9956254363059998 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2888607680797577, "train/contrastive_loss": 1.6935940980911255, "train/negative_loss": 1.6417105197906494, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.051883574575185776, "train/total_loss": 0.6275795698165894 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2867181599140167, "train/contrastive_loss": 0.2821022868156433, "train/negative_loss": 0.24514326453208923, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.03695903345942497, "train/total_loss": 0.34313860535621643 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2716374397277832, "train/contrastive_loss": 4.49190616607666, "train/negative_loss": 2.18587064743042, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.3060357570648193, "train/total_loss": 1.1700186729431152 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3197396695613861, "train/contrastive_loss": 1.5733642578125, "train/negative_loss": 0.9986933469772339, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.5746709704399109, "train/total_loss": 0.6344125270843506 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.23270614445209503, "train/contrastive_loss": 1.7262274026870728, "train/negative_loss": 1.7245793342590332, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0016481271013617516, "train/total_loss": 0.5779516100883484 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2607567608356476, "train/contrastive_loss": 5.528561592102051, "train/negative_loss": 2.7974326610565186, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.7311289310455322, "train/total_loss": 1.3664690256118774 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.27459150552749634, "train/contrastive_loss": 3.4055511951446533, "train/negative_loss": 2.3855397701263428, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.0200114250183105, "train/total_loss": 0.9557017683982849 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28914380073547363, "train/contrastive_loss": 1.8177766799926758, "train/negative_loss": 1.659364104270935, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.15841253101825714, "train/total_loss": 0.6526991128921509 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.31958192586898804, "train/contrastive_loss": 3.929149627685547, "train/negative_loss": 2.4659814834594727, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.4631681442260742, "train/total_loss": 1.1054118871688843 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2196313440799713, "train/contrastive_loss": 3.1857128143310547, "train/negative_loss": 2.962709426879883, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.22300350666046143, "train/total_loss": 0.8567739725112915 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28469201922416687, "train/contrastive_loss": 2.296447992324829, "train/negative_loss": 1.8910917043685913, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.40535634756088257, "train/total_loss": 0.7439815998077393 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3504771292209625, "train/contrastive_loss": 4.495262145996094, "train/negative_loss": 4.488855838775635, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0064062997698783875, "train/total_loss": 1.2495296001434326 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.27917760610580444, "train/contrastive_loss": 1.010267734527588, "train/negative_loss": 0.7466593980789185, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.26360830664634705, "train/total_loss": 0.481231153011322 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3012574315071106, "train/contrastive_loss": 4.016504287719727, "train/negative_loss": 2.8275396823883057, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.18896484375, "train/total_loss": 1.1045582294464111 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2221851497888565, "train/contrastive_loss": 1.6562566757202148, "train/negative_loss": 1.2890082597732544, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.36724844574928284, "train/total_loss": 0.5534365177154541 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.24506540596485138, "train/contrastive_loss": 5.210491180419922, "train/negative_loss": 3.3771255016326904, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.8333656787872314, "train/total_loss": 1.2871637344360352 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3047761023044586, "train/contrastive_loss": 1.3365381956100464, "train/negative_loss": 1.3220471143722534, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.01449110172688961, "train/total_loss": 0.5720837116241455 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2840941548347473, "train/contrastive_loss": 2.062333345413208, "train/negative_loss": 2.056055784225464, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0062774671241641045, "train/total_loss": 0.6965608596801758 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28721535205841064, "train/contrastive_loss": 1.5204625129699707, "train/negative_loss": 1.4459203481674194, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.07454212009906769, "train/total_loss": 0.5913078784942627 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.33346113562583923, "train/contrastive_loss": 3.6520848274230957, "train/negative_loss": 3.217862844467163, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.43422210216522217, "train/total_loss": 1.063878059387207 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.25263580679893494, "train/contrastive_loss": 4.213356971740723, "train/negative_loss": 1.8085908889770508, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.404766321182251, "train/total_loss": 1.0953072309494019 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.27537038922309875, "train/contrastive_loss": 1.8133575916290283, "train/negative_loss": 1.4918739795684814, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3214835524559021, "train/total_loss": 0.6380419135093689 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.31176668405532837, "train/contrastive_loss": 2.0695607662200928, "train/negative_loss": 2.0549192428588867, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.01464143581688404, "train/total_loss": 0.7256788015365601 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2532116770744324, "train/contrastive_loss": 2.148019790649414, "train/negative_loss": 1.1890658140182495, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.958953857421875, "train/total_loss": 0.682815670967102 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.30827730894088745, "train/contrastive_loss": 2.331303358078003, "train/negative_loss": 2.268155813217163, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.06314753741025925, "train/total_loss": 0.774537980556488 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.31441375613212585, "train/contrastive_loss": 1.7953717708587646, "train/negative_loss": 1.6414676904678345, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.1539040207862854, "train/total_loss": 0.6734881401062012 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2828734219074249, "train/contrastive_loss": 1.2499476671218872, "train/negative_loss": 1.1132442951202393, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.13670335710048676, "train/total_loss": 0.5328629612922668 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.35744303464889526, "train/contrastive_loss": 2.8758091926574707, "train/negative_loss": 2.5653278827667236, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.31048136949539185, "train/total_loss": 0.9326049089431763 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.23784872889518738, "train/contrastive_loss": 1.8612314462661743, "train/negative_loss": 1.859705924987793, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.0015254702884703875, "train/total_loss": 0.6100950241088867 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.24389959871768951, "train/contrastive_loss": 1.5987324714660645, "train/negative_loss": 0.9607344269752502, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.6379980444908142, "train/total_loss": 0.5636460781097412 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2681601643562317, "train/contrastive_loss": 2.4863693714141846, "train/negative_loss": 2.1036064624786377, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.3827628493309021, "train/total_loss": 0.7654340267181396 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.28281816840171814, "train/contrastive_loss": 4.531801223754883, "train/negative_loss": 2.6227142810821533, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.909087061882019, "train/total_loss": 1.189178466796875 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2909647524356842, "train/contrastive_loss": 2.298614501953125, "train/negative_loss": 1.843584418296814, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.4550301432609558, "train/total_loss": 0.7506876587867737 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.25383731722831726, "train/contrastive_loss": 0.5181118845939636, "train/negative_loss": 0.4596084654331207, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.058503407984972, "train/total_loss": 0.35745969414711 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.27694326639175415, "train/contrastive_loss": 2.7504169940948486, "train/negative_loss": 1.8726387023925781, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.8777782320976257, "train/total_loss": 0.8270266652107239 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.29925021529197693, "train/contrastive_loss": 2.403785467147827, "train/negative_loss": 2.342350959777832, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.061434555798769, "train/total_loss": 0.7800073027610779 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.23116818070411682, "train/contrastive_loss": 1.8308014869689941, "train/negative_loss": 1.4933220148086548, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.33747944235801697, "train/total_loss": 0.5973284840583801 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.27349355816841125, "train/contrastive_loss": 2.776144504547119, "train/negative_loss": 2.7390992641448975, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0370451882481575, "train/total_loss": 0.8287224769592285 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3065961003303528, "train/contrastive_loss": 3.2309837341308594, "train/negative_loss": 1.5713709592819214, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.6596126556396484, "train/total_loss": 0.9527928829193115 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2666000425815582, "train/contrastive_loss": 3.2088193893432617, "train/negative_loss": 3.2054524421691895, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0033669769763946533, "train/total_loss": 0.908363938331604 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2936076521873474, "train/contrastive_loss": 1.6566014289855957, "train/negative_loss": 1.557382345199585, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.09921909123659134, "train/total_loss": 0.6249279379844666 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2817278504371643, "train/contrastive_loss": 2.2113726139068604, "train/negative_loss": 2.1751155853271484, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.03625708073377609, "train/total_loss": 0.7240023612976074 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.228508859872818, "train/contrastive_loss": 2.889946460723877, "train/negative_loss": 2.2652790546417236, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.6246672868728638, "train/total_loss": 0.8064981698989868 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.30241695046424866, "train/contrastive_loss": 2.6104650497436523, "train/negative_loss": 1.6172579526901245, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.9932072162628174, "train/total_loss": 0.8245099782943726 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.3064451217651367, "train/contrastive_loss": 2.2361652851104736, "train/negative_loss": 1.6052446365356445, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.6309205889701843, "train/total_loss": 0.7536782026290894 }, { "epoch": 1.76056338028169, "eval_exact_match_accuracy": 0.03527336860670194, "eval_hamming_loss": 0.09295570079883805, "eval_loss": 0.7930232286453247, "eval_macro_f1": 0.02187651920272241, "eval_macro_precision": 0.05514705882352941, "eval_macro_recall": 0.01364463311097635, "eval_micro_f1": 0.09127789046653144, "eval_micro_precision": 0.9375, "eval_micro_recall": 0.04797441364605544, "eval_runtime": 2.8414, "eval_samples_per_second": 199.548, "eval_steps_per_second": 24.987, "step": 500 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.272177129983902, "train/contrastive_loss": 1.6633307933807373, "train/negative_loss": 1.0278187990188599, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.6355120539665222, "train/total_loss": 0.604843258857727 }, { "epoch": 1.76056338028169, "step": 500, "train/classification_loss": 0.2887512147426605, "train/contrastive_loss": 1.1888062953948975, "train/negative_loss": 0.9608774185180664, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.22792884707450867, "train/total_loss": 0.5265125036239624 }, { "epoch": 1.936619718309859, "grad_norm": 19.463146209716797, "learning_rate": 1.9937138830162087e-05, "loss": 1.1723, "step": 550 }, { "epoch": 1.936619718309859, "step": 550, "train/classification_loss": 0.26050716638565063, "train/contrastive_loss": 1.7977603673934937, "train/negative_loss": 1.2410331964492798, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.5567271709442139, "train/total_loss": 0.6200592517852783 }, { "epoch": 1.936619718309859, "step": 550, "train/classification_loss": 0.27938032150268555, "train/contrastive_loss": 1.2287302017211914, "train/negative_loss": 1.056685209274292, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.17204496264457703, "train/total_loss": 0.5251263380050659 }, { "epoch": 2.112676056338028, "grad_norm": 13.017983436584473, "learning_rate": 1.9930091613812545e-05, "loss": 1.1545, "step": 600 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2655118405818939, "train/contrastive_loss": 2.7165048122406006, "train/negative_loss": 2.4909591674804688, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.2255457192659378, "train/total_loss": 0.8088128566741943 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.35418999195098877, "train/contrastive_loss": 1.7897865772247314, "train/negative_loss": 1.7852965593338013, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.004490070044994354, "train/total_loss": 0.7121473550796509 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2882835566997528, "train/contrastive_loss": 3.125886917114258, "train/negative_loss": 2.148383617401123, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9775032997131348, "train/total_loss": 0.9134609699249268 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2018880397081375, "train/contrastive_loss": 2.4460976123809814, "train/negative_loss": 2.344330310821533, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.10176732391119003, "train/total_loss": 0.6911075711250305 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.262895405292511, "train/contrastive_loss": 3.8667688369750977, "train/negative_loss": 3.8429808616638184, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.023787880316376686, "train/total_loss": 1.0362491607666016 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.27121493220329285, "train/contrastive_loss": 3.6091127395629883, "train/negative_loss": 2.9608404636383057, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.6482722759246826, "train/total_loss": 0.9930374622344971 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.25528448820114136, "train/contrastive_loss": 2.0596120357513428, "train/negative_loss": 1.8073989152908325, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.25221318006515503, "train/total_loss": 0.667206883430481 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.29203322529792786, "train/contrastive_loss": 1.5734552145004272, "train/negative_loss": 1.573405385017395, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 4.983072358299978e-05, "train/total_loss": 0.6067242622375488 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2447809875011444, "train/contrastive_loss": 1.3014971017837524, "train/negative_loss": 1.2134637832641602, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.08803336322307587, "train/total_loss": 0.5050804018974304 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.28763678669929504, "train/contrastive_loss": 3.355006694793701, "train/negative_loss": 2.41642165184021, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.9385851621627808, "train/total_loss": 0.9586381912231445 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.24386745691299438, "train/contrastive_loss": 1.6079519987106323, "train/negative_loss": 1.6015613079071045, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.006390690803527832, "train/total_loss": 0.565457820892334 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.27382519841194153, "train/contrastive_loss": 2.1843647956848145, "train/negative_loss": 2.135948657989502, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.048416100442409515, "train/total_loss": 0.710698127746582 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.27145224809646606, "train/contrastive_loss": 5.196383476257324, "train/negative_loss": 4.228582382202148, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9678012132644653, "train/total_loss": 1.3107290267944336 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.307817280292511, "train/contrastive_loss": 1.743464708328247, "train/negative_loss": 1.4246816635131836, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.31878307461738586, "train/total_loss": 0.6565102338790894 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.19442690908908844, "train/contrastive_loss": 2.4461112022399902, "train/negative_loss": 1.6319011449813843, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8142101168632507, "train/total_loss": 0.6836491823196411 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.27335432171821594, "train/contrastive_loss": 2.657935380935669, "train/negative_loss": 2.2297253608703613, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.42820996046066284, "train/total_loss": 0.8049414157867432 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.24967409670352936, "train/contrastive_loss": 2.3317456245422363, "train/negative_loss": 2.2358877658843994, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.09585781395435333, "train/total_loss": 0.7160232067108154 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.26585885882377625, "train/contrastive_loss": 2.33823299407959, "train/negative_loss": 2.2738454341888428, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.06438751518726349, "train/total_loss": 0.7335054874420166 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2969436049461365, "train/contrastive_loss": 2.2686820030212402, "train/negative_loss": 2.2569010257720947, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.011780895292758942, "train/total_loss": 0.7506799697875977 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.22988630831241608, "train/contrastive_loss": 2.651657819747925, "train/negative_loss": 2.634925365447998, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.016732439398765564, "train/total_loss": 0.7602178454399109 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.22725173830986023, "train/contrastive_loss": 1.5604908466339111, "train/negative_loss": 1.3795166015625, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.18097421526908875, "train/total_loss": 0.5393499135971069 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.20920825004577637, "train/contrastive_loss": 2.2791993618011475, "train/negative_loss": 2.1695494651794434, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.10964998602867126, "train/total_loss": 0.6650481224060059 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2731555700302124, "train/contrastive_loss": 1.913442850112915, "train/negative_loss": 1.52596116065979, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.3874816298484802, "train/total_loss": 0.6558441519737244 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2883538007736206, "train/contrastive_loss": 3.0538086891174316, "train/negative_loss": 2.366272449493408, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.6875361800193787, "train/total_loss": 0.8991155624389648 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.270912766456604, "train/contrastive_loss": 1.44975745677948, "train/negative_loss": 1.1361711025238037, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.31358638405799866, "train/total_loss": 0.560864269733429 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.25922784209251404, "train/contrastive_loss": 3.3822884559631348, "train/negative_loss": 2.331347703933716, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0509408712387085, "train/total_loss": 0.9356855154037476 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2828563153743744, "train/contrastive_loss": 3.1865062713623047, "train/negative_loss": 3.0384509563446045, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.14805543422698975, "train/total_loss": 0.9201575517654419 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2778072953224182, "train/contrastive_loss": 0.8674440383911133, "train/negative_loss": 0.8614189028739929, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.006025121081620455, "train/total_loss": 0.4512960910797119 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.26533621549606323, "train/contrastive_loss": 4.989627838134766, "train/negative_loss": 2.029449224472046, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.960178852081299, "train/total_loss": 1.2632617950439453 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.3142849802970886, "train/contrastive_loss": 2.2525582313537598, "train/negative_loss": 1.6249645948410034, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.6275936961174011, "train/total_loss": 0.7647966146469116 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.22230415046215057, "train/contrastive_loss": 2.341874122619629, "train/negative_loss": 2.341752052307129, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0001221778802573681, "train/total_loss": 0.6906789541244507 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2520856261253357, "train/contrastive_loss": 4.726991176605225, "train/negative_loss": 3.535334825515747, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.191656231880188, "train/total_loss": 1.1974838972091675 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.26316654682159424, "train/contrastive_loss": 3.1302757263183594, "train/negative_loss": 2.7062013149261475, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.4240744113922119, "train/total_loss": 0.889221727848053 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2838142514228821, "train/contrastive_loss": 2.1439647674560547, "train/negative_loss": 1.8014320135116577, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.3425328731536865, "train/total_loss": 0.712607204914093 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.31727495789527893, "train/contrastive_loss": 2.5879080295562744, "train/negative_loss": 1.9560651779174805, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6318427920341492, "train/total_loss": 0.8348566293716431 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.20751053094863892, "train/contrastive_loss": 3.660047769546509, "train/negative_loss": 3.6077892780303955, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.052258577197790146, "train/total_loss": 0.9395201206207275 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.27994856238365173, "train/contrastive_loss": 3.369920492172241, "train/negative_loss": 2.3817219734191895, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.9881985783576965, "train/total_loss": 0.9539326429367065 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.3470801115036011, "train/contrastive_loss": 3.1829419136047363, "train/negative_loss": 3.1593027114868164, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.023639317601919174, "train/total_loss": 0.9836685061454773 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2744625210762024, "train/contrastive_loss": 0.7977559566497803, "train/negative_loss": 0.795982301235199, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.001773629686795175, "train/total_loss": 0.4340137243270874 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.3006003499031067, "train/contrastive_loss": 3.7789857387542725, "train/negative_loss": 2.5526533126831055, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.226332426071167, "train/total_loss": 1.0563974380493164 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2159285992383957, "train/contrastive_loss": 2.106112241744995, "train/negative_loss": 1.4221737384796143, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.6839384436607361, "train/total_loss": 0.6371510624885559 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2355670928955078, "train/contrastive_loss": 3.8951456546783447, "train/negative_loss": 3.606135129928589, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.2890104651451111, "train/total_loss": 1.0145962238311768 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2983419895172119, "train/contrastive_loss": 1.8662009239196777, "train/negative_loss": 1.8543726205825806, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.011828357353806496, "train/total_loss": 0.6715822219848633 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2829849421977997, "train/contrastive_loss": 2.2853145599365234, "train/negative_loss": 2.2846763134002686, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0006382851861417294, "train/total_loss": 0.7400478720664978 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.28188222646713257, "train/contrastive_loss": 2.4789621829986572, "train/negative_loss": 2.3751132488250732, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.10384893417358398, "train/total_loss": 0.777674674987793 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.3321971893310547, "train/contrastive_loss": 3.455317497253418, "train/negative_loss": 1.9387705326080322, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.5165468454360962, "train/total_loss": 1.0232607126235962 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.24286231398582458, "train/contrastive_loss": 2.267987012863159, "train/negative_loss": 1.2728211879730225, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9951657652854919, "train/total_loss": 0.6964597105979919 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2671754062175751, "train/contrastive_loss": 2.7592761516571045, "train/negative_loss": 2.329969882965088, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.42930617928504944, "train/total_loss": 0.8190306425094604 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.30591079592704773, "train/contrastive_loss": 3.1203904151916504, "train/negative_loss": 3.1192197799682617, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.0011705452343448997, "train/total_loss": 0.9299888610839844 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.24307727813720703, "train/contrastive_loss": 3.0907504558563232, "train/negative_loss": 1.889597773551941, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.2011526823043823, "train/total_loss": 0.8612273931503296 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.29708796739578247, "train/contrastive_loss": 3.106224775314331, "train/negative_loss": 2.2909767627716064, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.8152480125427246, "train/total_loss": 0.9183329343795776 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.3065061569213867, "train/contrastive_loss": 0.8311124444007874, "train/negative_loss": 0.8197550773620605, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.01135738380253315, "train/total_loss": 0.4727286696434021 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2737361192703247, "train/contrastive_loss": 1.6114311218261719, "train/negative_loss": 1.4044698476791382, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.2069612443447113, "train/total_loss": 0.596022367477417 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.3517117202281952, "train/contrastive_loss": 2.13155460357666, "train/negative_loss": 2.095580577850342, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.03597412258386612, "train/total_loss": 0.7780226469039917 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.22330208122730255, "train/contrastive_loss": 1.3648285865783691, "train/negative_loss": 1.3604246377944946, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.004403931554406881, "train/total_loss": 0.49626779556274414 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.22920459508895874, "train/contrastive_loss": 1.3932069540023804, "train/negative_loss": 1.3668732643127441, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.02633371204137802, "train/total_loss": 0.5078459978103638 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.25943541526794434, "train/contrastive_loss": 1.3731660842895508, "train/negative_loss": 1.3676259517669678, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.00554013391956687, "train/total_loss": 0.5340686440467834 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2787546217441559, "train/contrastive_loss": 3.2431516647338867, "train/negative_loss": 2.292062997817993, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.9510887265205383, "train/total_loss": 0.9273849725723267 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.285135954618454, "train/contrastive_loss": 2.672668933868408, "train/negative_loss": 2.601151704788208, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.07151711732149124, "train/total_loss": 0.8196697235107422 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.24279852211475372, "train/contrastive_loss": 0.33092400431632996, "train/negative_loss": 0.2881507873535156, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.04277321696281433, "train/total_loss": 0.30898332595825195 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.26458054780960083, "train/contrastive_loss": 2.991323471069336, "train/negative_loss": 2.2940022945404053, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.6973210573196411, "train/total_loss": 0.862845242023468 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2952703535556793, "train/contrastive_loss": 2.254122495651245, "train/negative_loss": 2.0741899013519287, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.17993269860744476, "train/total_loss": 0.746094822883606 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.21956709027290344, "train/contrastive_loss": 2.3346047401428223, "train/negative_loss": 2.2797367572784424, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.05486806854605675, "train/total_loss": 0.6864880323410034 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.26317569613456726, "train/contrastive_loss": 2.884903907775879, "train/negative_loss": 2.835430860519409, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.04947293549776077, "train/total_loss": 0.8401564359664917 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2982771098613739, "train/contrastive_loss": 1.7770580053329468, "train/negative_loss": 1.4397709369659424, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.337287038564682, "train/total_loss": 0.6536887288093567 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2596679925918579, "train/contrastive_loss": 5.190526485443115, "train/negative_loss": 5.189894199371338, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0006320484098978341, "train/total_loss": 1.2977733612060547 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.2867215573787689, "train/contrastive_loss": 1.3076599836349487, "train/negative_loss": 1.1543831825256348, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.15327675640583038, "train/total_loss": 0.5482535362243652 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.27485737204551697, "train/contrastive_loss": 2.8145785331726074, "train/negative_loss": 2.7869348526000977, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.027643561363220215, "train/total_loss": 0.8377730846405029 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.22017274796962738, "train/contrastive_loss": 2.8017265796661377, "train/negative_loss": 2.6876823902130127, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.11404415220022202, "train/total_loss": 0.780518114566803 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.29706528782844543, "train/contrastive_loss": 1.893568992614746, "train/negative_loss": 1.7392206192016602, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.15434837341308594, "train/total_loss": 0.6757791042327881 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.29672476649284363, "train/contrastive_loss": 2.324429988861084, "train/negative_loss": 2.2799794673919678, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.044450610876083374, "train/total_loss": 0.761610746383667 }, { "epoch": 2.112676056338028, "eval_exact_match_accuracy": 0.06701940035273368, "eval_hamming_loss": 0.08942836393816786, "eval_loss": 0.7768438458442688, "eval_macro_f1": 0.03455368161250514, "eval_macro_precision": 0.053708439897698204, "eval_macro_recall": 0.025469981807155852, "eval_micro_f1": 0.16310679611650486, "eval_micro_precision": 0.9130434782608695, "eval_micro_recall": 0.08955223880597014, "eval_runtime": 2.8443, "eval_samples_per_second": 199.346, "eval_steps_per_second": 24.962, "step": 600 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.23301708698272705, "train/contrastive_loss": 1.0185050964355469, "train/negative_loss": 0.9255691170692444, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.0929359570145607, "train/total_loss": 0.4367181062698364 }, { "epoch": 2.112676056338028, "step": 600, "train/classification_loss": 0.30060961842536926, "train/contrastive_loss": 1.328704833984375, "train/negative_loss": 1.2900022268295288, "train/num_negatives": 54, "train/num_positives": 2, "train/positive_loss": 0.038702648133039474, "train/total_loss": 0.5663505792617798 }, { "epoch": 2.288732394366197, "grad_norm": 14.132761001586914, "learning_rate": 1.9923044397463003e-05, "loss": 1.141, "step": 650 }, { "epoch": 2.288732394366197, "step": 650, "train/classification_loss": 0.26593494415283203, "train/contrastive_loss": 1.434600591659546, "train/negative_loss": 1.0088177919387817, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.42578282952308655, "train/total_loss": 0.5528550744056702 }, { "epoch": 2.288732394366197, "step": 650, "train/classification_loss": 0.33469271659851074, "train/contrastive_loss": 0.9574272632598877, "train/negative_loss": 0.6218593716621399, "train/num_negatives": 26, "train/num_positives": 10, "train/positive_loss": 0.3355679214000702, "train/total_loss": 0.5261781811714172 }, { "epoch": 2.464788732394366, "grad_norm": 11.614706993103027, "learning_rate": 1.991599718111346e-05, "loss": 1.1276, "step": 700 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26160183548927307, "train/contrastive_loss": 2.009491205215454, "train/negative_loss": 2.0051932334899902, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.004298079758882523, "train/total_loss": 0.6635000705718994 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.3489950895309448, "train/contrastive_loss": 1.4548521041870117, "train/negative_loss": 1.4246387481689453, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.03021341562271118, "train/total_loss": 0.6399655342102051 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.28580397367477417, "train/contrastive_loss": 2.9900283813476562, "train/negative_loss": 1.9930967092514038, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.996931791305542, "train/total_loss": 0.8838096857070923 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.19340381026268005, "train/contrastive_loss": 1.8040951490402222, "train/negative_loss": 1.3891160488128662, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.41497907042503357, "train/total_loss": 0.554222822189331 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2559998333454132, "train/contrastive_loss": 3.1747539043426514, "train/negative_loss": 2.8927342891693115, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.2820196747779846, "train/total_loss": 0.8909506797790527 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26788848638534546, "train/contrastive_loss": 2.892021656036377, "train/negative_loss": 2.1982061862945557, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.6938154101371765, "train/total_loss": 0.8462928533554077 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.24627529084682465, "train/contrastive_loss": 2.3007020950317383, "train/negative_loss": 1.1821531057357788, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.1185489892959595, "train/total_loss": 0.7064157128334045 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.27907198667526245, "train/contrastive_loss": 1.1958181858062744, "train/negative_loss": 1.195792317390442, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 2.5868750526569784e-05, "train/total_loss": 0.5182356238365173 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.22659878432750702, "train/contrastive_loss": 1.5324945449829102, "train/negative_loss": 1.1574326753616333, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.37506192922592163, "train/total_loss": 0.5330976843833923 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2787783443927765, "train/contrastive_loss": 2.935335874557495, "train/negative_loss": 1.3649426698684692, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.5703932046890259, "train/total_loss": 0.8658455610275269 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2323508858680725, "train/contrastive_loss": 1.201979398727417, "train/negative_loss": 1.1058276891708374, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.0961516723036766, "train/total_loss": 0.4727467894554138 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26310840249061584, "train/contrastive_loss": 1.5375195741653442, "train/negative_loss": 1.4847670793533325, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.052752535790205, "train/total_loss": 0.5706123113632202 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26589787006378174, "train/contrastive_loss": 5.935999870300293, "train/negative_loss": 3.2628040313720703, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.6731958389282227, "train/total_loss": 1.4530978202819824 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.29565703868865967, "train/contrastive_loss": 1.8856391906738281, "train/negative_loss": 1.7572426795959473, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.12839657068252563, "train/total_loss": 0.6727849245071411 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.1868654489517212, "train/contrastive_loss": 2.650007486343384, "train/negative_loss": 1.233117938041687, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.4168895483016968, "train/total_loss": 0.7168669700622559 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2679687440395355, "train/contrastive_loss": 2.0526623725891113, "train/negative_loss": 1.8156697750091553, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.23699267208576202, "train/total_loss": 0.6785012483596802 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2409229278564453, "train/contrastive_loss": 2.007019519805908, "train/negative_loss": 1.8985358476638794, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.10848365724086761, "train/total_loss": 0.642326831817627 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.25849634408950806, "train/contrastive_loss": 1.664421796798706, "train/negative_loss": 1.496127724647522, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.1682940572500229, "train/total_loss": 0.5913807153701782 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.28674477338790894, "train/contrastive_loss": 2.489363670349121, "train/negative_loss": 2.305185556411743, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.18417812883853912, "train/total_loss": 0.78461754322052 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.22376161813735962, "train/contrastive_loss": 2.142667770385742, "train/negative_loss": 1.9347009658813477, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.20796677470207214, "train/total_loss": 0.6522951722145081 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.21757212281227112, "train/contrastive_loss": 1.4172059297561646, "train/negative_loss": 1.3893778324127197, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.02782805822789669, "train/total_loss": 0.5010132789611816 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.1990765482187271, "train/contrastive_loss": 2.7547669410705566, "train/negative_loss": 2.121692180633545, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6330747604370117, "train/total_loss": 0.7500299215316772 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26614558696746826, "train/contrastive_loss": 1.6581043004989624, "train/negative_loss": 1.2447292804718018, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.41337499022483826, "train/total_loss": 0.5977664589881897 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2881677448749542, "train/contrastive_loss": 3.0211892127990723, "train/negative_loss": 1.4713469743728638, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.549842357635498, "train/total_loss": 0.89240562915802 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26242172718048096, "train/contrastive_loss": 1.866014003753662, "train/negative_loss": 1.0343221426010132, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.8316918611526489, "train/total_loss": 0.6356245279312134 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.25315940380096436, "train/contrastive_loss": 3.169330596923828, "train/negative_loss": 2.0961296558380127, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0732009410858154, "train/total_loss": 0.8870255351066589 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2769738435745239, "train/contrastive_loss": 2.8473868370056152, "train/negative_loss": 2.842177152633667, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.005209724418818951, "train/total_loss": 0.8464512228965759 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2702639102935791, "train/contrastive_loss": 0.43696677684783936, "train/negative_loss": 0.4276716709136963, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.009295119903981686, "train/total_loss": 0.357657253742218 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2649320363998413, "train/contrastive_loss": 4.0508856773376465, "train/negative_loss": 1.8131588697433472, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.237726926803589, "train/total_loss": 1.0751092433929443 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.3046039640903473, "train/contrastive_loss": 1.2810300588607788, "train/negative_loss": 1.1386232376098633, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.14240680634975433, "train/total_loss": 0.5608099699020386 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.21259135007858276, "train/contrastive_loss": 1.4091565608978271, "train/negative_loss": 1.408933401107788, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0002231640974059701, "train/total_loss": 0.49442267417907715 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2486288696527481, "train/contrastive_loss": 4.611261367797852, "train/negative_loss": 2.3544013500213623, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.2568600177764893, "train/total_loss": 1.1708811521530151 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.25692251324653625, "train/contrastive_loss": 3.3561017513275146, "train/negative_loss": 2.010610580444336, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.3454911708831787, "train/total_loss": 0.9281429052352905 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.27464237809181213, "train/contrastive_loss": 1.9858033657073975, "train/negative_loss": 1.7059353590011597, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.2798679769039154, "train/total_loss": 0.6718030571937561 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.31064096093177795, "train/contrastive_loss": 2.6247735023498535, "train/negative_loss": 2.1107285022735596, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.514045000076294, "train/total_loss": 0.8355957269668579 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.19985580444335938, "train/contrastive_loss": 3.0397794246673584, "train/negative_loss": 2.7400920391082764, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.29968732595443726, "train/total_loss": 0.8078116774559021 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.27227783203125, "train/contrastive_loss": 1.791211485862732, "train/negative_loss": 1.4521441459655762, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.33906733989715576, "train/total_loss": 0.6305201053619385 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.3416289985179901, "train/contrastive_loss": 3.330692768096924, "train/negative_loss": 3.3222756385803223, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.00841722171753645, "train/total_loss": 1.0077675580978394 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26505497097969055, "train/contrastive_loss": 0.704699695110321, "train/negative_loss": 0.7026187777519226, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.002080937847495079, "train/total_loss": 0.40599489212036133 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.29826709628105164, "train/contrastive_loss": 4.536911964416504, "train/negative_loss": 2.966407299041748, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.5705044269561768, "train/total_loss": 1.205649495124817 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.20360641181468964, "train/contrastive_loss": 1.3062645196914673, "train/negative_loss": 1.0606977939605713, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.24556677043437958, "train/total_loss": 0.4648593068122864 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.22966787219047546, "train/contrastive_loss": 3.801238536834717, "train/negative_loss": 2.7578775882720947, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.0433610677719116, "train/total_loss": 0.9899156093597412 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2880914807319641, "train/contrastive_loss": 1.2372689247131348, "train/negative_loss": 1.1856848001480103, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0515841506421566, "train/total_loss": 0.535545289516449 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2807157635688782, "train/contrastive_loss": 2.0164473056793213, "train/negative_loss": 2.014331102371216, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0021161732729524374, "train/total_loss": 0.6840052604675293 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.27108246088027954, "train/contrastive_loss": 1.4438271522521973, "train/negative_loss": 1.2064590454101562, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.2373681366443634, "train/total_loss": 0.559847891330719 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.33205175399780273, "train/contrastive_loss": 2.6006836891174316, "train/negative_loss": 2.2137322425842285, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.38695135712623596, "train/total_loss": 0.8521885275840759 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.23320068418979645, "train/contrastive_loss": 2.6594433784484863, "train/negative_loss": 1.4917128086090088, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.167730450630188, "train/total_loss": 0.7650893330574036 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2598276436328888, "train/contrastive_loss": 1.8245913982391357, "train/negative_loss": 1.3977611064910889, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4268302321434021, "train/total_loss": 0.6247459650039673 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2979010343551636, "train/contrastive_loss": 2.5640647411346436, "train/negative_loss": 2.5639495849609375, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.00011516280210344121, "train/total_loss": 0.8107140064239502 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.23783941566944122, "train/contrastive_loss": 2.694197654724121, "train/negative_loss": 1.6137291193008423, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.0804685354232788, "train/total_loss": 0.7766789197921753 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2812771201133728, "train/contrastive_loss": 2.404744863510132, "train/negative_loss": 2.1674630641937256, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.23728182911872864, "train/total_loss": 0.7622261047363281 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2981731593608856, "train/contrastive_loss": 0.9076513051986694, "train/negative_loss": 0.8752302527427673, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.03242107480764389, "train/total_loss": 0.479703426361084 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26617908477783203, "train/contrastive_loss": 1.1268925666809082, "train/negative_loss": 0.8994209170341492, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.22747159004211426, "train/total_loss": 0.49155759811401367 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.34852468967437744, "train/contrastive_loss": 2.451164722442627, "train/negative_loss": 2.0943233966827393, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.3568412661552429, "train/total_loss": 0.8387576341629028 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.21351921558380127, "train/contrastive_loss": 1.3077449798583984, "train/negative_loss": 1.2763208150863647, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.03142421320080757, "train/total_loss": 0.47506821155548096 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.22098085284233093, "train/contrastive_loss": 1.252382755279541, "train/negative_loss": 0.9320904612541199, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.32029226422309875, "train/total_loss": 0.47145742177963257 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.24900402128696442, "train/contrastive_loss": 1.5956631898880005, "train/negative_loss": 1.4973597526550293, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.09830348938703537, "train/total_loss": 0.5681366920471191 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2717909514904022, "train/contrastive_loss": 3.126350164413452, "train/negative_loss": 2.1042404174804688, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.0221097469329834, "train/total_loss": 0.8970609903335571 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.27638933062553406, "train/contrastive_loss": 2.0312418937683105, "train/negative_loss": 1.7461339235305786, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.2851078510284424, "train/total_loss": 0.6826376914978027 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.22918930649757385, "train/contrastive_loss": 0.6197246313095093, "train/negative_loss": 0.5883871912956238, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.03133746609091759, "train/total_loss": 0.35313424468040466 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.25562724471092224, "train/contrastive_loss": 2.7033188343048096, "train/negative_loss": 1.738297700881958, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.9650211334228516, "train/total_loss": 0.7962909936904907 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2959875464439392, "train/contrastive_loss": 2.5730886459350586, "train/negative_loss": 2.090815544128418, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.4822732210159302, "train/total_loss": 0.8106052875518799 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.20701751112937927, "train/contrastive_loss": 2.353665351867676, "train/negative_loss": 1.7266006469726562, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.62706458568573, "train/total_loss": 0.6777505874633789 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2567755877971649, "train/contrastive_loss": 2.0725317001342773, "train/negative_loss": 1.6104071140289307, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.46212470531463623, "train/total_loss": 0.6712819337844849 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2919117510318756, "train/contrastive_loss": 2.773078680038452, "train/negative_loss": 1.5652027130126953, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.2078759670257568, "train/total_loss": 0.8465274572372437 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.24964767694473267, "train/contrastive_loss": 4.710105895996094, "train/negative_loss": 4.71002721786499, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 7.888646359788254e-05, "train/total_loss": 1.1916688680648804 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.279945969581604, "train/contrastive_loss": 1.2637437582015991, "train/negative_loss": 1.243511438369751, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.020232265815138817, "train/total_loss": 0.5326946973800659 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.26825597882270813, "train/contrastive_loss": 2.8947269916534424, "train/negative_loss": 2.7786574363708496, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.11606947332620621, "train/total_loss": 0.8472013473510742 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.21056686341762543, "train/contrastive_loss": 1.890453815460205, "train/negative_loss": 1.755068063735962, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.13538573682308197, "train/total_loss": 0.5886576175689697 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2907728850841522, "train/contrastive_loss": 1.5807266235351562, "train/negative_loss": 1.4380918741226196, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.1426348090171814, "train/total_loss": 0.606918215751648 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.29031291604042053, "train/contrastive_loss": 1.907941460609436, "train/negative_loss": 1.5485501289367676, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.35939133167266846, "train/total_loss": 0.6719012260437012 }, { "epoch": 2.464788732394366, "eval_exact_match_accuracy": 0.08641975308641975, "eval_hamming_loss": 0.08828716671853927, "eval_loss": 0.7173317670822144, "eval_macro_f1": 0.03832151753209427, "eval_macro_precision": 0.052056220718375845, "eval_macro_recall": 0.030321406913280773, "eval_micro_f1": 0.19029495718363462, "eval_micro_precision": 0.8849557522123894, "eval_micro_recall": 0.10660980810234541, "eval_runtime": 2.8445, "eval_samples_per_second": 199.329, "eval_steps_per_second": 24.96, "step": 700 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.2534940540790558, "train/contrastive_loss": 1.2565116882324219, "train/negative_loss": 1.11784827709198, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.1386633664369583, "train/total_loss": 0.5047963857650757 }, { "epoch": 2.464788732394366, "step": 700, "train/classification_loss": 0.17683963477611542, "train/contrastive_loss": 1.7005207538604736, "train/negative_loss": 1.2565371990203857, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4439835548400879, "train/total_loss": 0.5169438123703003 }, { "epoch": 2.640845070422535, "grad_norm": 12.585654258728027, "learning_rate": 1.990894996476392e-05, "loss": 1.07, "step": 750 }, { "epoch": 2.640845070422535, "step": 750, "train/classification_loss": 0.2328159660100937, "train/contrastive_loss": 1.05596923828125, "train/negative_loss": 0.9213714599609375, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.1345977932214737, "train/total_loss": 0.44400981068611145 }, { "epoch": 2.640845070422535, "step": 750, "train/classification_loss": 0.2837826907634735, "train/contrastive_loss": 1.1195340156555176, "train/negative_loss": 1.021483063697815, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.09805101156234741, "train/total_loss": 0.5076894760131836 }, { "epoch": 2.816901408450704, "grad_norm": 16.904903411865234, "learning_rate": 1.990190274841438e-05, "loss": 1.1083, "step": 800 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.25530996918678284, "train/contrastive_loss": 2.436138153076172, "train/negative_loss": 2.422919750213623, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.013218455947935581, "train/total_loss": 0.7425376176834106 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.3374779522418976, "train/contrastive_loss": 1.0352551937103271, "train/negative_loss": 1.0000343322753906, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.03522083908319473, "train/total_loss": 0.5445289611816406 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.28194302320480347, "train/contrastive_loss": 2.598475456237793, "train/negative_loss": 1.653485655784607, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9449899196624756, "train/total_loss": 0.801638126373291 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.18934272229671478, "train/contrastive_loss": 1.750364065170288, "train/negative_loss": 1.53482186794281, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.21554219722747803, "train/total_loss": 0.5394155383110046 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.25565478205680847, "train/contrastive_loss": 3.2658021450042725, "train/negative_loss": 2.750257730484009, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.5155444741249084, "train/total_loss": 0.9088152647018433 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.26185911893844604, "train/contrastive_loss": 2.891963005065918, "train/negative_loss": 2.178420305252075, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.7135428190231323, "train/total_loss": 0.8402517437934875 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24465319514274597, "train/contrastive_loss": 2.005976915359497, "train/negative_loss": 1.4147852659225464, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.5911916494369507, "train/total_loss": 0.6458485722541809 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2738387882709503, "train/contrastive_loss": 1.1176095008850098, "train/negative_loss": 1.1175786256790161, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 3.087568256887607e-05, "train/total_loss": 0.4973607063293457 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.21923665702342987, "train/contrastive_loss": 1.5575358867645264, "train/negative_loss": 1.2310187816619873, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.32651710510253906, "train/total_loss": 0.5307438373565674 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.27326807379722595, "train/contrastive_loss": 3.082857131958008, "train/negative_loss": 1.7860063314437866, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.2968506813049316, "train/total_loss": 0.8898395299911499 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.22566792368888855, "train/contrastive_loss": 1.2392702102661133, "train/negative_loss": 1.046807050704956, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.19246315956115723, "train/total_loss": 0.4735219478607178 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2538541853427887, "train/contrastive_loss": 1.246451735496521, "train/negative_loss": 1.2069483995437622, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.03950328752398491, "train/total_loss": 0.5031445026397705 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.25708866119384766, "train/contrastive_loss": 4.670703887939453, "train/negative_loss": 3.3335177898406982, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3371858596801758, "train/total_loss": 1.1912294626235962 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.29008904099464417, "train/contrastive_loss": 2.7323391437530518, "train/negative_loss": 2.552006244659424, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.1803329586982727, "train/total_loss": 0.8365569114685059 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.18288853764533997, "train/contrastive_loss": 2.640139579772949, "train/negative_loss": 1.3435602188110352, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.296579360961914, "train/total_loss": 0.7109165191650391 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.25801247358322144, "train/contrastive_loss": 2.0654172897338867, "train/negative_loss": 1.4576373100280762, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.6077799201011658, "train/total_loss": 0.6710959672927856 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2303646057844162, "train/contrastive_loss": 1.7863417863845825, "train/negative_loss": 1.3515750169754028, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4347667992115021, "train/total_loss": 0.587632954120636 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24760179221630096, "train/contrastive_loss": 2.480180263519287, "train/negative_loss": 2.380378484725952, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.09980181604623795, "train/total_loss": 0.7436378598213196 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.27540767192840576, "train/contrastive_loss": 2.197237253189087, "train/negative_loss": 2.103907346725464, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.093330018222332, "train/total_loss": 0.7148551344871521 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.21698682010173798, "train/contrastive_loss": 3.030367612838745, "train/negative_loss": 2.7388713359832764, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.29149627685546875, "train/total_loss": 0.8230603933334351 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.21215276420116425, "train/contrastive_loss": 1.6111845970153809, "train/negative_loss": 1.593361258506775, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.017823360860347748, "train/total_loss": 0.5343896746635437 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.19150559604167938, "train/contrastive_loss": 2.1677191257476807, "train/negative_loss": 2.014702796936035, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.15301623940467834, "train/total_loss": 0.6250494122505188 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2543528079986572, "train/contrastive_loss": 1.461971640586853, "train/negative_loss": 1.1034489870071411, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.3585226535797119, "train/total_loss": 0.5467471480369568 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.28685474395751953, "train/contrastive_loss": 2.5784759521484375, "train/negative_loss": 1.704355239868164, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.8741205930709839, "train/total_loss": 0.8025499582290649 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.25493335723876953, "train/contrastive_loss": 2.051750421524048, "train/negative_loss": 1.2813271284103394, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.7704232931137085, "train/total_loss": 0.6652834415435791 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24819374084472656, "train/contrastive_loss": 1.961195945739746, "train/negative_loss": 1.8431615829467773, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.11803442239761353, "train/total_loss": 0.6404329538345337 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2704271674156189, "train/contrastive_loss": 2.840777635574341, "train/negative_loss": 2.760887622833252, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.07989010959863663, "train/total_loss": 0.8385826945304871 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.26017406582832336, "train/contrastive_loss": 0.879958987236023, "train/negative_loss": 0.8019862771034241, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.07797269523143768, "train/total_loss": 0.43616586923599243 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.26372599601745605, "train/contrastive_loss": 3.3286662101745605, "train/negative_loss": 2.2956743240356445, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0329917669296265, "train/total_loss": 0.929459273815155 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2945454716682434, "train/contrastive_loss": 1.7435551881790161, "train/negative_loss": 1.708172082901001, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.03538309410214424, "train/total_loss": 0.6432565450668335 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2104320377111435, "train/contrastive_loss": 1.5684928894042969, "train/negative_loss": 1.5593011379241943, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.009191783145070076, "train/total_loss": 0.524130642414093 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.23950229585170746, "train/contrastive_loss": 3.3051068782806396, "train/negative_loss": 2.5042731761932373, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8008337020874023, "train/total_loss": 0.9005237221717834 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24864685535430908, "train/contrastive_loss": 2.874927520751953, "train/negative_loss": 1.861314296722412, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.013613224029541, "train/total_loss": 0.8236323595046997 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.26860445737838745, "train/contrastive_loss": 2.1972618103027344, "train/negative_loss": 2.1391520500183105, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.05810968205332756, "train/total_loss": 0.7080568075180054 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2958243787288666, "train/contrastive_loss": 2.8103344440460205, "train/negative_loss": 2.4228763580322266, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.38745805621147156, "train/total_loss": 0.857891321182251 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.1951732039451599, "train/contrastive_loss": 2.352726697921753, "train/negative_loss": 2.095808267593384, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.2569184899330139, "train/total_loss": 0.6657185554504395 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.264277845621109, "train/contrastive_loss": 1.8340411186218262, "train/negative_loss": 1.7576637268066406, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.07637742906808853, "train/total_loss": 0.6310861110687256 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.32850220799446106, "train/contrastive_loss": 3.4041428565979004, "train/negative_loss": 3.388155460357666, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.01598750427365303, "train/total_loss": 1.0093307495117188 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2550434172153473, "train/contrastive_loss": 1.6375336647033691, "train/negative_loss": 1.6250334978103638, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.012500218115746975, "train/total_loss": 0.5825501680374146 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.291134774684906, "train/contrastive_loss": 3.782825231552124, "train/negative_loss": 3.4734084606170654, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.30941683053970337, "train/total_loss": 1.0476998090744019 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.19983667135238647, "train/contrastive_loss": 1.3478055000305176, "train/negative_loss": 1.2320120334625244, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.11579342186450958, "train/total_loss": 0.46939778327941895 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.22298429906368256, "train/contrastive_loss": 3.5381340980529785, "train/negative_loss": 2.65381121635437, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.8843229413032532, "train/total_loss": 0.9306111335754395 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.28030794858932495, "train/contrastive_loss": 1.4580556154251099, "train/negative_loss": 1.4495916366577148, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.008464016020298004, "train/total_loss": 0.5719190835952759 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.27817320823669434, "train/contrastive_loss": 1.6760679483413696, "train/negative_loss": 1.6634886264801025, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.012579305097460747, "train/total_loss": 0.6133868098258972 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2633680999279022, "train/contrastive_loss": 2.0351154804229736, "train/negative_loss": 1.8000682592391968, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.23504719138145447, "train/total_loss": 0.6703912019729614 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.3214731812477112, "train/contrastive_loss": 3.6920042037963867, "train/negative_loss": 3.0195672512054443, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.6724368333816528, "train/total_loss": 1.0598740577697754 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.22473084926605225, "train/contrastive_loss": 2.4874930381774902, "train/negative_loss": 1.979832649230957, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.507660448551178, "train/total_loss": 0.7222294807434082 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2553084194660187, "train/contrastive_loss": 1.3869521617889404, "train/negative_loss": 1.161912202835083, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.22503989934921265, "train/total_loss": 0.5326988697052002 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2978564202785492, "train/contrastive_loss": 2.9334352016448975, "train/negative_loss": 2.933372974395752, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 6.210996798472479e-05, "train/total_loss": 0.8845434188842773 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.23521746695041656, "train/contrastive_loss": 2.9775519371032715, "train/negative_loss": 2.2168920040130615, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.7606600522994995, "train/total_loss": 0.8307278752326965 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.26708418130874634, "train/contrastive_loss": 2.4387190341949463, "train/negative_loss": 2.3446977138519287, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.09402133524417877, "train/total_loss": 0.7548279762268066 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.29026615619659424, "train/contrastive_loss": 0.9986672401428223, "train/negative_loss": 0.9358220100402832, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.06284521520137787, "train/total_loss": 0.48999959230422974 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2614245116710663, "train/contrastive_loss": 1.0351309776306152, "train/negative_loss": 0.9160920977592468, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.1190388947725296, "train/total_loss": 0.46845072507858276 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.3408012390136719, "train/contrastive_loss": 2.7718424797058105, "train/negative_loss": 2.7475712299346924, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.02427135780453682, "train/total_loss": 0.895169734954834 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.20949704945087433, "train/contrastive_loss": 1.3126007318496704, "train/negative_loss": 1.0364757776260376, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2761249542236328, "train/total_loss": 0.47201722860336304 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.21531300246715546, "train/contrastive_loss": 1.5455608367919922, "train/negative_loss": 1.2875653505325317, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.25799551606178284, "train/total_loss": 0.5244251489639282 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24157361686229706, "train/contrastive_loss": 1.898134469985962, "train/negative_loss": 1.511379599571228, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.3867548704147339, "train/total_loss": 0.6212005019187927 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2620825171470642, "train/contrastive_loss": 2.258037567138672, "train/negative_loss": 1.6570624113082886, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.6009751558303833, "train/total_loss": 0.7136900424957275 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2702169120311737, "train/contrastive_loss": 3.007739305496216, "train/negative_loss": 2.9511866569519043, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.05655274540185928, "train/total_loss": 0.8717647790908813 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.21575193107128143, "train/contrastive_loss": 0.4348738491535187, "train/negative_loss": 0.42594432830810547, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.008929528295993805, "train/total_loss": 0.302726686000824 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24968865513801575, "train/contrastive_loss": 2.4363017082214355, "train/negative_loss": 1.8530491590499878, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.5832524299621582, "train/total_loss": 0.7369489669799805 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.29271823167800903, "train/contrastive_loss": 2.594679117202759, "train/negative_loss": 2.2339677810668945, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.3607114255428314, "train/total_loss": 0.8116540908813477 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.20150186121463776, "train/contrastive_loss": 2.305906295776367, "train/negative_loss": 1.461719036102295, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8441872000694275, "train/total_loss": 0.6626831293106079 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2527795135974884, "train/contrastive_loss": 2.8478028774261475, "train/negative_loss": 2.579000234603882, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.26880255341529846, "train/total_loss": 0.8223401308059692 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.27862924337387085, "train/contrastive_loss": 1.8087778091430664, "train/negative_loss": 1.5379607677459717, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.2708171010017395, "train/total_loss": 0.6403847932815552 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.24101270735263824, "train/contrastive_loss": 4.855133533477783, "train/negative_loss": 4.8550944328308105, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 3.922153700841591e-05, "train/total_loss": 1.2120394706726074 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2651229798793793, "train/contrastive_loss": 1.641740083694458, "train/negative_loss": 1.5914775133132935, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.05026261880993843, "train/total_loss": 0.5934709906578064 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2658005952835083, "train/contrastive_loss": 2.2454192638397217, "train/negative_loss": 1.7501306533813477, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4952886998653412, "train/total_loss": 0.7148844599723816 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2068278044462204, "train/contrastive_loss": 2.4670262336730957, "train/negative_loss": 2.3775181770324707, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.08950802683830261, "train/total_loss": 0.7002330422401428 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.28742626309394836, "train/contrastive_loss": 2.058751106262207, "train/negative_loss": 1.9918733835220337, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.0668778270483017, "train/total_loss": 0.6991764903068542 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2809467315673828, "train/contrastive_loss": 2.4301342964172363, "train/negative_loss": 2.245181083679199, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.18495316803455353, "train/total_loss": 0.766973614692688 }, { "epoch": 2.816901408450704, "eval_exact_match_accuracy": 0.07583774250440917, "eval_hamming_loss": 0.08828716671853927, "eval_loss": 0.7093353271484375, "eval_macro_f1": 0.039402468066681094, "eval_macro_precision": 0.11255656108597284, "eval_macro_recall": 0.02976965672190796, "eval_micro_f1": 0.1840843720038351, "eval_micro_precision": 0.9142857142857143, "eval_micro_recall": 0.1023454157782516, "eval_runtime": 2.8396, "eval_samples_per_second": 199.677, "eval_steps_per_second": 25.004, "step": 800 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.252003937959671, "train/contrastive_loss": 1.3974590301513672, "train/negative_loss": 0.8496163487434387, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.5478426814079285, "train/total_loss": 0.5314957499504089 }, { "epoch": 2.816901408450704, "step": 800, "train/classification_loss": 0.2942037880420685, "train/contrastive_loss": 1.0723258256912231, "train/negative_loss": 0.9051344990730286, "train/num_negatives": 42, "train/num_positives": 6, "train/positive_loss": 0.16719137132167816, "train/total_loss": 0.5086689591407776 }, { "epoch": 2.992957746478873, "grad_norm": 9.401230812072754, "learning_rate": 1.9894855532064835e-05, "loss": 1.0828, "step": 850 }, { "epoch": 2.992957746478873, "step": 850, "train/classification_loss": 0.27011895179748535, "train/contrastive_loss": 1.1434996128082275, "train/negative_loss": 0.8881341814994812, "train/num_negatives": 38, "train/num_positives": 18, "train/positive_loss": 0.2553654611110687, "train/total_loss": 0.49881887435913086 }, { "epoch": 2.992957746478873, "step": 850, "train/classification_loss": 0.2618882954120636, "train/contrastive_loss": 0.9530047178268433, "train/negative_loss": 0.7438822984695435, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.2091224193572998, "train/total_loss": 0.4524892568588257 }, { "epoch": 3.169014084507042, "grad_norm": 12.180469512939453, "learning_rate": 1.9887808315715293e-05, "loss": 1.0268, "step": 900 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.25358226895332336, "train/contrastive_loss": 1.9923863410949707, "train/negative_loss": 1.7963001728057861, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.1960861086845398, "train/total_loss": 0.6520595550537109 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.33721333742141724, "train/contrastive_loss": 1.2469919919967651, "train/negative_loss": 1.0868885517120361, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.1601034700870514, "train/total_loss": 0.5866117477416992 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2690930664539337, "train/contrastive_loss": 2.7295455932617188, "train/negative_loss": 1.2594517469406128, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.4700939655303955, "train/total_loss": 0.8150022029876709 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.18621936440467834, "train/contrastive_loss": 1.6868665218353271, "train/negative_loss": 1.5004374980926514, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.18642906844615936, "train/total_loss": 0.5235927104949951 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2418345808982849, "train/contrastive_loss": 3.0100104808807373, "train/negative_loss": 2.782055139541626, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.22795523703098297, "train/total_loss": 0.8438366651535034 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.25583726167678833, "train/contrastive_loss": 2.327380418777466, "train/negative_loss": 1.7409801483154297, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.5864002704620361, "train/total_loss": 0.7213133573532104 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2349979132413864, "train/contrastive_loss": 1.4303185939788818, "train/negative_loss": 0.9587671756744385, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.47155144810676575, "train/total_loss": 0.5210616588592529 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2661401629447937, "train/contrastive_loss": 0.7526309490203857, "train/negative_loss": 0.7526141405105591, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 1.6808651707833633e-05, "train/total_loss": 0.4166663587093353 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.20879028737545013, "train/contrastive_loss": 0.8466865420341492, "train/negative_loss": 0.8190524578094482, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.027634065598249435, "train/total_loss": 0.3781276047229767 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.270837664604187, "train/contrastive_loss": 3.236480712890625, "train/negative_loss": 2.2038185596466064, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.032662034034729, "train/total_loss": 0.9181337952613831 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.21749143302440643, "train/contrastive_loss": 1.2317242622375488, "train/negative_loss": 1.160201072692871, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.07152324914932251, "train/total_loss": 0.46383628249168396 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2534635663032532, "train/contrastive_loss": 1.7865002155303955, "train/negative_loss": 1.6147598028182983, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.17174047231674194, "train/total_loss": 0.6107636094093323 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2502749264240265, "train/contrastive_loss": 4.4567742347717285, "train/negative_loss": 2.673809051513672, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.7829651832580566, "train/total_loss": 1.1416298151016235 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.27925580739974976, "train/contrastive_loss": 1.762145757675171, "train/negative_loss": 1.72877037525177, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.033375371247529984, "train/total_loss": 0.6316849589347839 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.17603686451911926, "train/contrastive_loss": 2.4854531288146973, "train/negative_loss": 1.1680917739868164, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.3173613548278809, "train/total_loss": 0.6731275320053101 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.24764235317707062, "train/contrastive_loss": 1.7742722034454346, "train/negative_loss": 0.775140643119812, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.9991315007209778, "train/total_loss": 0.6024968028068542 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.21514207124710083, "train/contrastive_loss": 1.61635160446167, "train/negative_loss": 1.422782063484192, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.19356957077980042, "train/total_loss": 0.5384123921394348 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2396659255027771, "train/contrastive_loss": 2.763972043991089, "train/negative_loss": 2.73207688331604, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.03189517930150032, "train/total_loss": 0.7924603223800659 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2650146186351776, "train/contrastive_loss": 2.48262357711792, "train/negative_loss": 2.475081205368042, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.007542412728071213, "train/total_loss": 0.7615393400192261 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.21354293823242188, "train/contrastive_loss": 2.597524881362915, "train/negative_loss": 2.4310214519500732, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.16650345921516418, "train/total_loss": 0.7330479025840759 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.20551535487174988, "train/contrastive_loss": 1.978804588317871, "train/negative_loss": 1.85262131690979, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.12618324160575867, "train/total_loss": 0.6012762784957886 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.18886318802833557, "train/contrastive_loss": 2.2895596027374268, "train/negative_loss": 2.266066789627075, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.023492876440286636, "train/total_loss": 0.6467751264572144 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2466670721769333, "train/contrastive_loss": 1.8031994104385376, "train/negative_loss": 1.6978203058242798, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.105379119515419, "train/total_loss": 0.607306957244873 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2870582640171051, "train/contrastive_loss": 2.804509162902832, "train/negative_loss": 1.702981948852539, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.1015270948410034, "train/total_loss": 0.8479601144790649 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.24687239527702332, "train/contrastive_loss": 1.1275032758712769, "train/negative_loss": 0.9102397561073303, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.21726350486278534, "train/total_loss": 0.4723730683326721 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.23745234310626984, "train/contrastive_loss": 2.7406063079833984, "train/negative_loss": 2.04325532913208, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6973509192466736, "train/total_loss": 0.7855736017227173 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.26930058002471924, "train/contrastive_loss": 2.458677053451538, "train/negative_loss": 2.4018378257751465, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.056839242577552795, "train/total_loss": 0.7610360383987427 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2535470426082611, "train/contrastive_loss": 1.8438407182693481, "train/negative_loss": 1.6169536113739014, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.22688713669776917, "train/total_loss": 0.6223151683807373 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2579350769519806, "train/contrastive_loss": 3.7865653038024902, "train/negative_loss": 1.6754318475723267, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.111133337020874, "train/total_loss": 1.01524817943573 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2838534116744995, "train/contrastive_loss": 1.2872849702835083, "train/negative_loss": 1.2478972673416138, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.03938775882124901, "train/total_loss": 0.5413104295730591 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2081357091665268, "train/contrastive_loss": 2.1145899295806885, "train/negative_loss": 2.11407470703125, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0005153264501132071, "train/total_loss": 0.6310536861419678 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.23127244412899017, "train/contrastive_loss": 2.789837598800659, "train/negative_loss": 2.005688428878784, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7841491103172302, "train/total_loss": 0.7892400026321411 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2362528145313263, "train/contrastive_loss": 1.9099745750427246, "train/negative_loss": 1.3928916454315186, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5170829892158508, "train/total_loss": 0.6182477474212646 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.259905606508255, "train/contrastive_loss": 1.8167695999145508, "train/negative_loss": 1.674485206604004, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.14228445291519165, "train/total_loss": 0.6232595443725586 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.28814688324928284, "train/contrastive_loss": 2.8386669158935547, "train/negative_loss": 2.108210802078247, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.7304562330245972, "train/total_loss": 0.8558802604675293 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.18821392953395844, "train/contrastive_loss": 1.8747836351394653, "train/negative_loss": 1.8118003606796265, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.06298328191041946, "train/total_loss": 0.5631706714630127 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.26654890179634094, "train/contrastive_loss": 1.9006266593933105, "train/negative_loss": 1.1798664331436157, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.7207602262496948, "train/total_loss": 0.6466742753982544 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.319775253534317, "train/contrastive_loss": 1.3892217874526978, "train/negative_loss": 1.3537771701812744, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.035444606095552444, "train/total_loss": 0.5976196527481079 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.24637575447559357, "train/contrastive_loss": 0.6561765670776367, "train/negative_loss": 0.6435545682907104, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.012622025795280933, "train/total_loss": 0.37761107087135315 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2969827950000763, "train/contrastive_loss": 3.5329229831695557, "train/negative_loss": 2.3411078453063965, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.1918151378631592, "train/total_loss": 1.0035674571990967 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.18902000784873962, "train/contrastive_loss": 0.9614936113357544, "train/negative_loss": 0.7187949419021606, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.24269866943359375, "train/total_loss": 0.38131874799728394 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2200397104024887, "train/contrastive_loss": 3.7696337699890137, "train/negative_loss": 3.1244354248046875, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6451984643936157, "train/total_loss": 0.9739664793014526 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.27559593319892883, "train/contrastive_loss": 1.152921438217163, "train/negative_loss": 1.1186774969100952, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.03424391895532608, "train/total_loss": 0.5061802268028259 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.28067702054977417, "train/contrastive_loss": 1.3491246700286865, "train/negative_loss": 1.0117920637130737, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.337332546710968, "train/total_loss": 0.5505019426345825 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.25605034828186035, "train/contrastive_loss": 1.8900290727615356, "train/negative_loss": 1.779759407043457, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.11026965826749802, "train/total_loss": 0.6340562105178833 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.31310468912124634, "train/contrastive_loss": 2.294672966003418, "train/negative_loss": 1.685768723487854, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.6089043021202087, "train/total_loss": 0.7720392942428589 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.22021882236003876, "train/contrastive_loss": 2.3119664192199707, "train/negative_loss": 1.7251931428909302, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5867732167243958, "train/total_loss": 0.6826121211051941 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2507193088531494, "train/contrastive_loss": 1.7474128007888794, "train/negative_loss": 1.2832971811294556, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4641156494617462, "train/total_loss": 0.6002018451690674 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.29070261120796204, "train/contrastive_loss": 3.328002452850342, "train/negative_loss": 3.3279781341552734, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 2.4318991563632153e-05, "train/total_loss": 0.9563031196594238 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.22610525786876678, "train/contrastive_loss": 2.796560049057007, "train/negative_loss": 1.909249186515808, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.8873108625411987, "train/total_loss": 0.7854173183441162 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.25967052578926086, "train/contrastive_loss": 2.43886137008667, "train/negative_loss": 2.076239824295044, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.3626216650009155, "train/total_loss": 0.7474428415298462 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2802373766899109, "train/contrastive_loss": 0.8633297681808472, "train/negative_loss": 0.6441264152526855, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.21920333802700043, "train/total_loss": 0.4529033303260803 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2545483112335205, "train/contrastive_loss": 1.4053995609283447, "train/negative_loss": 1.0480958223342896, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.3573037385940552, "train/total_loss": 0.5356281995773315 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.3251075744628906, "train/contrastive_loss": 1.5251171588897705, "train/negative_loss": 1.2969127893447876, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.2282043993473053, "train/total_loss": 0.6301310062408447 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.20154227316379547, "train/contrastive_loss": 0.8990278840065002, "train/negative_loss": 0.8234050273895264, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.07562287896871567, "train/total_loss": 0.3813478350639343 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.20155936479568481, "train/contrastive_loss": 1.091333031654358, "train/negative_loss": 0.9378836154937744, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.15344937145709991, "train/total_loss": 0.4198259711265564 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.23542320728302002, "train/contrastive_loss": 1.8291407823562622, "train/negative_loss": 1.4410908222198486, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.38804998993873596, "train/total_loss": 0.6012513637542725 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.25759339332580566, "train/contrastive_loss": 2.8283519744873047, "train/negative_loss": 1.410085678100586, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.4182664155960083, "train/total_loss": 0.8232638239860535 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2626960575580597, "train/contrastive_loss": 2.476795196533203, "train/negative_loss": 2.470823287963867, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.0059718117117881775, "train/total_loss": 0.7580550909042358 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.20553740859031677, "train/contrastive_loss": 0.3179081082344055, "train/negative_loss": 0.2770361602306366, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.04087194427847862, "train/total_loss": 0.2691190242767334 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.24472014605998993, "train/contrastive_loss": 3.0500593185424805, "train/negative_loss": 2.091676950454712, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.958382248878479, "train/total_loss": 0.8547320365905762 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.293016254901886, "train/contrastive_loss": 2.809427261352539, "train/negative_loss": 1.9499094486236572, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.8595178127288818, "train/total_loss": 0.8549017310142517 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.19498024880886078, "train/contrastive_loss": 1.9063409566879272, "train/negative_loss": 1.4219688177108765, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.4843721389770508, "train/total_loss": 0.5762484669685364 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.24755001068115234, "train/contrastive_loss": 2.495579242706299, "train/negative_loss": 2.300785779953003, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.19479335844516754, "train/total_loss": 0.7466658353805542 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2649572491645813, "train/contrastive_loss": 1.0680320262908936, "train/negative_loss": 0.9751583933830261, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.09287359565496445, "train/total_loss": 0.47856366634368896 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.23454870283603668, "train/contrastive_loss": 5.323813438415527, "train/negative_loss": 5.323805809020996, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 7.486403319489909e-06, "train/total_loss": 1.2993113994598389 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.25739285349845886, "train/contrastive_loss": 1.1266157627105713, "train/negative_loss": 0.8640680909156799, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.26254770159721375, "train/total_loss": 0.48271602392196655 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2637128531932831, "train/contrastive_loss": 1.78715181350708, "train/negative_loss": 1.5449166297912598, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.24223516881465912, "train/total_loss": 0.6211432218551636 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.200800359249115, "train/contrastive_loss": 2.5807042121887207, "train/negative_loss": 1.5696772336959839, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.0110269784927368, "train/total_loss": 0.716941237449646 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2878514528274536, "train/contrastive_loss": 1.995542287826538, "train/negative_loss": 1.9333635568618774, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.06217879056930542, "train/total_loss": 0.6869599223136902 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2737419307231903, "train/contrastive_loss": 4.395015716552734, "train/negative_loss": 3.087554931640625, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 1.307460904121399, "train/total_loss": 1.1527451276779175 }, { "epoch": 3.169014084507042, "eval_exact_match_accuracy": 0.10405643738977072, "eval_hamming_loss": 0.08621226268285091, "eval_loss": 0.673316478729248, "eval_macro_f1": 0.06435205817060254, "eval_macro_precision": 0.16397058823529412, "eval_macro_recall": 0.051660252363578525, "eval_micro_f1": 0.25336927223719674, "eval_micro_precision": 0.8057142857142857, "eval_micro_recall": 0.15031982942430705, "eval_runtime": 2.8568, "eval_samples_per_second": 198.473, "eval_steps_per_second": 24.853, "step": 900 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.2628500759601593, "train/contrastive_loss": 1.3113716840744019, "train/negative_loss": 1.305722951889038, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.005648748017847538, "train/total_loss": 0.5251244306564331 }, { "epoch": 3.169014084507042, "step": 900, "train/classification_loss": 0.21615852415561676, "train/contrastive_loss": 0.9258386492729187, "train/negative_loss": 0.7519519925117493, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.17388665676116943, "train/total_loss": 0.4013262391090393 }, { "epoch": 3.345070422535211, "grad_norm": 19.28108787536621, "learning_rate": 1.988076109936575e-05, "loss": 1.0389, "step": 950 }, { "epoch": 3.345070422535211, "step": 950, "train/classification_loss": 0.2880273461341858, "train/contrastive_loss": 2.0527405738830566, "train/negative_loss": 1.7265995740890503, "train/num_negatives": 40, "train/num_positives": 4, "train/positive_loss": 0.3261411190032959, "train/total_loss": 0.698575496673584 }, { "epoch": 3.345070422535211, "step": 950, "train/classification_loss": 0.2285711169242859, "train/contrastive_loss": 0.9377437829971313, "train/negative_loss": 0.8507233262062073, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.08702044188976288, "train/total_loss": 0.41611987352371216 }, { "epoch": 3.52112676056338, "grad_norm": 15.228022575378418, "learning_rate": 1.987371388301621e-05, "loss": 1.0161, "step": 1000 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.24659588932991028, "train/contrastive_loss": 2.060753107070923, "train/negative_loss": 1.508183479309082, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5525696873664856, "train/total_loss": 0.6587464809417725 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.3281591534614563, "train/contrastive_loss": 1.4071173667907715, "train/negative_loss": 0.6819202303886414, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.7251971960067749, "train/total_loss": 0.6095826625823975 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2778911888599396, "train/contrastive_loss": 3.0015885829925537, "train/negative_loss": 1.6918468475341797, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.309741735458374, "train/total_loss": 0.8782088756561279 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.1679188311100006, "train/contrastive_loss": 1.164793848991394, "train/negative_loss": 1.0715124607086182, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.09328135848045349, "train/total_loss": 0.40087759494781494 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2491820901632309, "train/contrastive_loss": 2.691622495651245, "train/negative_loss": 2.2680039405822754, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.42361846566200256, "train/total_loss": 0.787506639957428 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2490396499633789, "train/contrastive_loss": 3.1627893447875977, "train/negative_loss": 1.8857285976409912, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.2770607471466064, "train/total_loss": 0.8815975189208984 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2303515374660492, "train/contrastive_loss": 2.1189987659454346, "train/negative_loss": 1.2774397134780884, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.8415589928627014, "train/total_loss": 0.6541513204574585 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.25099775195121765, "train/contrastive_loss": 1.2132492065429688, "train/negative_loss": 1.2132288217544556, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 2.0384995877975598e-05, "train/total_loss": 0.49364757537841797 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.18784703314304352, "train/contrastive_loss": 0.7816201448440552, "train/negative_loss": 0.46114498376846313, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.32047513127326965, "train/total_loss": 0.34417104721069336 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2678319215774536, "train/contrastive_loss": 3.3326683044433594, "train/negative_loss": 1.8832197189331055, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.4494484663009644, "train/total_loss": 0.9343655705451965 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2084895223379135, "train/contrastive_loss": 1.2625449895858765, "train/negative_loss": 1.0778404474258423, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.18470454216003418, "train/total_loss": 0.46099853515625 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2397947907447815, "train/contrastive_loss": 1.2310004234313965, "train/negative_loss": 1.2204564809799194, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.010543959215283394, "train/total_loss": 0.4859948754310608 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2481394112110138, "train/contrastive_loss": 4.0711164474487305, "train/negative_loss": 2.1748838424682617, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.8962326049804688, "train/total_loss": 1.0623626708984375 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.278243750333786, "train/contrastive_loss": 1.6890828609466553, "train/negative_loss": 1.6558380126953125, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.03324489668011665, "train/total_loss": 0.6160603165626526 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.17101134359836578, "train/contrastive_loss": 2.4853248596191406, "train/negative_loss": 1.0175129175186157, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.467811942100525, "train/total_loss": 0.6680763363838196 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23633305728435516, "train/contrastive_loss": 1.3315913677215576, "train/negative_loss": 0.9168295860290527, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.41476184129714966, "train/total_loss": 0.5026513338088989 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.20215222239494324, "train/contrastive_loss": 1.2464224100112915, "train/negative_loss": 0.9159505367279053, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3304719030857086, "train/total_loss": 0.45143669843673706 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23914499580860138, "train/contrastive_loss": 2.2031474113464355, "train/negative_loss": 1.9642727375030518, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.23887477815151215, "train/total_loss": 0.6797744631767273 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2514301836490631, "train/contrastive_loss": 1.0630979537963867, "train/negative_loss": 1.0438395738601685, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.019258422777056694, "train/total_loss": 0.464049756526947 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2085026204586029, "train/contrastive_loss": 2.897691249847412, "train/negative_loss": 2.0091145038604736, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8885766863822937, "train/total_loss": 0.7880408763885498 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.19692005217075348, "train/contrastive_loss": 1.5920015573501587, "train/negative_loss": 1.1873434782028198, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.4046580493450165, "train/total_loss": 0.515320360660553 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.177629753947258, "train/contrastive_loss": 3.0995242595672607, "train/negative_loss": 2.2610092163085938, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8385149836540222, "train/total_loss": 0.7975346446037292 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23684047162532806, "train/contrastive_loss": 1.7231837511062622, "train/negative_loss": 1.2479214668273926, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.47526228427886963, "train/total_loss": 0.5814772248268127 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2805205285549164, "train/contrastive_loss": 2.201094150543213, "train/negative_loss": 1.3151105642318726, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.8859834671020508, "train/total_loss": 0.7207393646240234 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23459100723266602, "train/contrastive_loss": 2.1292617321014404, "train/negative_loss": 0.8994188904762268, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.2298427820205688, "train/total_loss": 0.6604433655738831 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23213499784469604, "train/contrastive_loss": 2.771615743637085, "train/negative_loss": 2.22808575630188, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5435300469398499, "train/total_loss": 0.7864581346511841 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.25737622380256653, "train/contrastive_loss": 1.7168982028961182, "train/negative_loss": 1.7139739990234375, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0029241731390357018, "train/total_loss": 0.6007558703422546 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.24245132505893707, "train/contrastive_loss": 0.5793294906616211, "train/negative_loss": 0.5424954891204834, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.03683401271700859, "train/total_loss": 0.35831722617149353 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2571668028831482, "train/contrastive_loss": 3.6397993564605713, "train/negative_loss": 1.5242211818695068, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.1155781745910645, "train/total_loss": 0.9851266741752625 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2782219648361206, "train/contrastive_loss": 0.9946987628936768, "train/negative_loss": 0.9718318581581116, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.02286689728498459, "train/total_loss": 0.477161705493927 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.20099972188472748, "train/contrastive_loss": 1.7147216796875, "train/negative_loss": 1.6883797645568848, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.02634197100996971, "train/total_loss": 0.5439440608024597 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.22822096943855286, "train/contrastive_loss": 3.840061664581299, "train/negative_loss": 2.472417116165161, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.3676444292068481, "train/total_loss": 0.996233344078064 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2354201376438141, "train/contrastive_loss": 2.713012933731079, "train/negative_loss": 2.1191723346710205, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5938405394554138, "train/total_loss": 0.7780227661132812 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.25253626704216003, "train/contrastive_loss": 1.547911524772644, "train/negative_loss": 1.4815728664398193, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.0663386881351471, "train/total_loss": 0.5621185898780823 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2873808741569519, "train/contrastive_loss": 3.0936532020568848, "train/negative_loss": 2.072852373123169, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.0208008289337158, "train/total_loss": 0.9061115384101868 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.1729366034269333, "train/contrastive_loss": 1.9159187078475952, "train/negative_loss": 1.8947396278381348, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.021179111674427986, "train/total_loss": 0.5561203360557556 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.25718632340431213, "train/contrastive_loss": 1.9518499374389648, "train/negative_loss": 0.9657573103904724, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.9860926270484924, "train/total_loss": 0.6475563049316406 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.30859431624412537, "train/contrastive_loss": 2.0318307876586914, "train/negative_loss": 1.8518718481063843, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.1799589991569519, "train/total_loss": 0.7149604558944702 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2361467033624649, "train/contrastive_loss": 0.563295841217041, "train/negative_loss": 0.4943731129169464, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.06892272084951401, "train/total_loss": 0.34880587458610535 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2919042408466339, "train/contrastive_loss": 3.4503490924835205, "train/negative_loss": 2.130063056945801, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.3202860355377197, "train/total_loss": 0.9819741249084473 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.1812683790922165, "train/contrastive_loss": 0.7683617472648621, "train/negative_loss": 0.6469441652297974, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.1214175820350647, "train/total_loss": 0.33494073152542114 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2186700701713562, "train/contrastive_loss": 3.6752686500549316, "train/negative_loss": 2.2658612728118896, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.4094072580337524, "train/total_loss": 0.9537237882614136 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2589084506034851, "train/contrastive_loss": 0.94645094871521, "train/negative_loss": 0.945676863193512, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0007741086883470416, "train/total_loss": 0.4481986463069916 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2766871154308319, "train/contrastive_loss": 1.231074333190918, "train/negative_loss": 1.220503330230713, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.010571012273430824, "train/total_loss": 0.5229020118713379 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.24836365878582, "train/contrastive_loss": 1.3828072547912598, "train/negative_loss": 1.3475455045700073, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.03526173159480095, "train/total_loss": 0.5249251127243042 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.3172628879547119, "train/contrastive_loss": 3.442688465118408, "train/negative_loss": 2.3860249519348145, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.0566633939743042, "train/total_loss": 1.0058006048202515 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.21261222660541534, "train/contrastive_loss": 1.6953009366989136, "train/negative_loss": 1.269429326057434, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.4258715808391571, "train/total_loss": 0.5516723990440369 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23725734651088715, "train/contrastive_loss": 2.443549394607544, "train/negative_loss": 1.7813152074813843, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6622342467308044, "train/total_loss": 0.7259672284126282 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2844632863998413, "train/contrastive_loss": 2.510272979736328, "train/negative_loss": 2.509378671646118, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.0008944099536165595, "train/total_loss": 0.7865179181098938 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.21981112658977509, "train/contrastive_loss": 2.5818116664886475, "train/negative_loss": 1.5117744207382202, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.0700372457504272, "train/total_loss": 0.7361735105514526 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2378627061843872, "train/contrastive_loss": 1.1071714162826538, "train/negative_loss": 0.8405683040618896, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.2666030824184418, "train/total_loss": 0.4592970013618469 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2751213312149048, "train/contrastive_loss": 0.8608742952346802, "train/negative_loss": 0.6029313206672668, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.25794294476509094, "train/total_loss": 0.4472962021827698 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.24389474093914032, "train/contrastive_loss": 1.2948613166809082, "train/negative_loss": 0.709494411945343, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5853668451309204, "train/total_loss": 0.5028669834136963 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.3243478238582611, "train/contrastive_loss": 1.8313242197036743, "train/negative_loss": 1.7057645320892334, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.12555965781211853, "train/total_loss": 0.6906126737594604 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.18626669049263, "train/contrastive_loss": 1.1465792655944824, "train/negative_loss": 1.0097198486328125, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.13685943186283112, "train/total_loss": 0.415582537651062 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.18911504745483398, "train/contrastive_loss": 1.2773925065994263, "train/negative_loss": 0.5432942509651184, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.7340982556343079, "train/total_loss": 0.44459354877471924 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.22916723787784576, "train/contrastive_loss": 1.9191935062408447, "train/negative_loss": 1.0063399076461792, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9128535389900208, "train/total_loss": 0.6130059361457825 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2522820830345154, "train/contrastive_loss": 2.130955219268799, "train/negative_loss": 1.295016884803772, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.8359382152557373, "train/total_loss": 0.6784731149673462 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2548275589942932, "train/contrastive_loss": 1.3030062913894653, "train/negative_loss": 1.2422012090682983, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.06080511212348938, "train/total_loss": 0.5154287815093994 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.20139287412166595, "train/contrastive_loss": 0.4285404682159424, "train/negative_loss": 0.3663267195224762, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.062213748693466187, "train/total_loss": 0.28710097074508667 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.24033991992473602, "train/contrastive_loss": 2.683631181716919, "train/negative_loss": 1.7628206014633179, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.9208105206489563, "train/total_loss": 0.777066171169281 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.295841783285141, "train/contrastive_loss": 3.220322608947754, "train/negative_loss": 1.9369618892669678, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 1.2833607196807861, "train/total_loss": 0.9399063587188721 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.18783165514469147, "train/contrastive_loss": 2.452139377593994, "train/negative_loss": 1.7211363315582275, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.7310030460357666, "train/total_loss": 0.678259551525116 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.23536640405654907, "train/contrastive_loss": 1.9533640146255493, "train/negative_loss": 1.7359412908554077, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.21742267906665802, "train/total_loss": 0.6260392069816589 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.26207321882247925, "train/contrastive_loss": 1.5476288795471191, "train/negative_loss": 1.0087196826934814, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.5389091968536377, "train/total_loss": 0.571599006652832 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2266044020652771, "train/contrastive_loss": 3.437208652496338, "train/negative_loss": 3.4371867179870605, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.185210178140551e-05, "train/total_loss": 0.9140461683273315 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.24644531309604645, "train/contrastive_loss": 1.173646092414856, "train/negative_loss": 0.5878365635871887, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.5858095288276672, "train/total_loss": 0.4811745285987854 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2580612301826477, "train/contrastive_loss": 2.2025082111358643, "train/negative_loss": 1.7459800243377686, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4565282464027405, "train/total_loss": 0.6985628604888916 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.19897712767124176, "train/contrastive_loss": 3.304173469543457, "train/negative_loss": 1.8232210874557495, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.480952501296997, "train/total_loss": 0.8598118424415588 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.28154003620147705, "train/contrastive_loss": 1.8293871879577637, "train/negative_loss": 1.365809440612793, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.4635777473449707, "train/total_loss": 0.6474174857139587 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2619515657424927, "train/contrastive_loss": 2.638002395629883, "train/negative_loss": 1.7948802709579468, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.8431222438812256, "train/total_loss": 0.7895520329475403 }, { "epoch": 3.52112676056338, "eval_exact_match_accuracy": 0.1164021164021164, "eval_hamming_loss": 0.08382612304180932, "eval_loss": 0.6472141742706299, "eval_macro_f1": 0.08606886646339473, "eval_macro_precision": 0.15593506219692177, "eval_macro_recall": 0.06341313724661743, "eval_micro_f1": 0.2798573975044563, "eval_micro_precision": 0.8532608695652174, "eval_micro_recall": 0.1673773987206823, "eval_runtime": 2.839, "eval_samples_per_second": 199.715, "eval_steps_per_second": 25.008, "step": 1000 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.20714882016181946, "train/contrastive_loss": 1.2321231365203857, "train/negative_loss": 0.6984319090843201, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5336912870407104, "train/total_loss": 0.45357346534729004 }, { "epoch": 3.52112676056338, "step": 1000, "train/classification_loss": 0.2867993116378784, "train/contrastive_loss": 1.9529364109039307, "train/negative_loss": 1.218223214149475, "train/num_negatives": 22, "train/num_positives": 24, "train/positive_loss": 0.7347131967544556, "train/total_loss": 0.6773866415023804 }, { "epoch": 3.697183098591549, "grad_norm": 17.127878189086914, "learning_rate": 1.9866666666666667e-05, "loss": 0.9922, "step": 1050 }, { "epoch": 3.697183098591549, "step": 1050, "train/classification_loss": 0.2515946626663208, "train/contrastive_loss": 1.5435893535614014, "train/negative_loss": 0.8575651049613953, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.6860242486000061, "train/total_loss": 0.5603125095367432 }, { "epoch": 3.697183098591549, "step": 1050, "train/classification_loss": 0.25624769926071167, "train/contrastive_loss": 0.8319815397262573, "train/negative_loss": 0.7657333016395569, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.06624826043844223, "train/total_loss": 0.4226440191268921 }, { "epoch": 3.873239436619718, "grad_norm": 11.773343086242676, "learning_rate": 1.9859619450317125e-05, "loss": 0.9917, "step": 1100 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23831522464752197, "train/contrastive_loss": 2.427889823913574, "train/negative_loss": 2.3044111728668213, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.12347874045372009, "train/total_loss": 0.7238931655883789 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.3279215395450592, "train/contrastive_loss": 2.4086203575134277, "train/negative_loss": 2.1797428131103516, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.22887754440307617, "train/total_loss": 0.8096456527709961 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2689489424228668, "train/contrastive_loss": 2.8508143424987793, "train/negative_loss": 2.243807554244995, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.6070067286491394, "train/total_loss": 0.8391118049621582 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17307421565055847, "train/contrastive_loss": 2.916548252105713, "train/negative_loss": 2.9024291038513184, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.014119124040007591, "train/total_loss": 0.7563838958740234 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23352594673633575, "train/contrastive_loss": 4.547475337982178, "train/negative_loss": 4.540761470794678, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.00671407300978899, "train/total_loss": 1.1430209875106812 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24048519134521484, "train/contrastive_loss": 2.9878389835357666, "train/negative_loss": 2.5133676528930664, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.4744713008403778, "train/total_loss": 0.8380529880523682 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.22496269643306732, "train/contrastive_loss": 3.085120677947998, "train/negative_loss": 1.4385730028152466, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.6465476751327515, "train/total_loss": 0.8419868350028992 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2456701546907425, "train/contrastive_loss": 1.4610172510147095, "train/negative_loss": 1.4609971046447754, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 2.014657366089523e-05, "train/total_loss": 0.5378736257553101 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17375747859477997, "train/contrastive_loss": 0.6639258861541748, "train/negative_loss": 0.5872737169265747, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.07665219157934189, "train/total_loss": 0.30654266476631165 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2648347318172455, "train/contrastive_loss": 3.2213895320892334, "train/negative_loss": 2.68839693069458, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5329925417900085, "train/total_loss": 0.9091126918792725 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.19973190128803253, "train/contrastive_loss": 1.3084367513656616, "train/negative_loss": 1.2911714315414429, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.017265362665057182, "train/total_loss": 0.4614192843437195 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23393574357032776, "train/contrastive_loss": 2.3132243156433105, "train/negative_loss": 2.2991549968719482, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.014069284312427044, "train/total_loss": 0.6965806484222412 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24310286343097687, "train/contrastive_loss": 4.247648239135742, "train/negative_loss": 2.6359286308288574, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.6117196083068848, "train/total_loss": 1.092632532119751 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.257038414478302, "train/contrastive_loss": 1.3331999778747559, "train/negative_loss": 1.2541568279266357, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.07904312014579773, "train/total_loss": 0.5236784219741821 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.1624750941991806, "train/contrastive_loss": 1.777597427368164, "train/negative_loss": 0.9836911559104919, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.7939062118530273, "train/total_loss": 0.5179945826530457 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23082579672336578, "train/contrastive_loss": 1.6016342639923096, "train/negative_loss": 1.4055243730545044, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.19610992074012756, "train/total_loss": 0.5511526465415955 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.19881311058998108, "train/contrastive_loss": 1.967290997505188, "train/negative_loss": 1.9302352666854858, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.03705578297376633, "train/total_loss": 0.5922713279724121 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23374062776565552, "train/contrastive_loss": 2.46852445602417, "train/negative_loss": 2.39452862739563, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.07399576902389526, "train/total_loss": 0.7274454832077026 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24928463995456696, "train/contrastive_loss": 1.578418254852295, "train/negative_loss": 1.5245360136032104, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.053882207721471786, "train/total_loss": 0.5649682879447937 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.20311260223388672, "train/contrastive_loss": 2.4354147911071777, "train/negative_loss": 2.2176971435546875, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.21771764755249023, "train/total_loss": 0.6901955604553223 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.18941310048103333, "train/contrastive_loss": 2.361656904220581, "train/negative_loss": 1.9931424856185913, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.36851444840431213, "train/total_loss": 0.6617444753646851 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17063772678375244, "train/contrastive_loss": 2.5735113620758057, "train/negative_loss": 2.4765305519104004, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.09698088467121124, "train/total_loss": 0.6853399872779846 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2295491248369217, "train/contrastive_loss": 3.1196184158325195, "train/negative_loss": 1.6238735914230347, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.4957447052001953, "train/total_loss": 0.8534728288650513 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.26753488183021545, "train/contrastive_loss": 3.100071668624878, "train/negative_loss": 2.682760000228882, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.4173116087913513, "train/total_loss": 0.8875492811203003 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2236568033695221, "train/contrastive_loss": 1.2429547309875488, "train/negative_loss": 1.1811189651489258, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.06183582544326782, "train/total_loss": 0.47224774956703186 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.22711753845214844, "train/contrastive_loss": 3.682501792907715, "train/negative_loss": 3.281054973602295, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4014468491077423, "train/total_loss": 0.9636179208755493 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.25347572565078735, "train/contrastive_loss": 2.073573350906372, "train/negative_loss": 2.0726492404937744, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0009240152430720627, "train/total_loss": 0.6681903600692749 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2347225546836853, "train/contrastive_loss": 1.01730215549469, "train/negative_loss": 1.0127335786819458, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.004568600561469793, "train/total_loss": 0.4381830096244812 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.26009488105773926, "train/contrastive_loss": 3.5207643508911133, "train/negative_loss": 1.9920603036880493, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.5287041664123535, "train/total_loss": 0.9642477631568909 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2768598198890686, "train/contrastive_loss": 1.423134446144104, "train/negative_loss": 1.416304588317871, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0068298340775072575, "train/total_loss": 0.5614867210388184 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.19549112021923065, "train/contrastive_loss": 2.6246564388275146, "train/negative_loss": 2.6213796138763428, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.003276816103607416, "train/total_loss": 0.7204224467277527 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2180773764848709, "train/contrastive_loss": 3.728764295578003, "train/negative_loss": 3.021785020828247, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7069792151451111, "train/total_loss": 0.9638302326202393 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.22918613255023956, "train/contrastive_loss": 3.689828395843506, "train/negative_loss": 3.0234792232513428, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.6663492321968079, "train/total_loss": 0.9671518206596375 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.25230127573013306, "train/contrastive_loss": 3.1345293521881104, "train/negative_loss": 1.7227782011032104, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 1.4117511510849, "train/total_loss": 0.8792071342468262 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.284618616104126, "train/contrastive_loss": 2.3714370727539062, "train/negative_loss": 1.9443162679672241, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.4271208643913269, "train/total_loss": 0.7589060068130493 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17087684571743011, "train/contrastive_loss": 2.491471767425537, "train/negative_loss": 2.4905407428741455, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.000930906506255269, "train/total_loss": 0.6691712141036987 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.25164154171943665, "train/contrastive_loss": 2.440986394882202, "train/negative_loss": 2.041640520095825, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.39934593439102173, "train/total_loss": 0.7398388385772705 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.3038838803768158, "train/contrastive_loss": 1.4890421628952026, "train/negative_loss": 1.3099987506866455, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.17904341220855713, "train/total_loss": 0.6016923189163208 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23057648539543152, "train/contrastive_loss": 1.0312519073486328, "train/negative_loss": 0.9848721623420715, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.04637974873185158, "train/total_loss": 0.4368268847465515 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2917994260787964, "train/contrastive_loss": 5.907462120056152, "train/negative_loss": 2.056241750717163, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 3.85122013092041, "train/total_loss": 1.4732918739318848 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17872579395771027, "train/contrastive_loss": 1.196420669555664, "train/negative_loss": 1.0647977590560913, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.13162286579608917, "train/total_loss": 0.4180099368095398 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.20605939626693726, "train/contrastive_loss": 2.464670181274414, "train/negative_loss": 2.334632635116577, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.13003748655319214, "train/total_loss": 0.698993444442749 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2552935481071472, "train/contrastive_loss": 1.8695108890533447, "train/negative_loss": 1.8687865734100342, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0007242750725708902, "train/total_loss": 0.6291956901550293 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2797108590602875, "train/contrastive_loss": 0.9901911616325378, "train/negative_loss": 0.9834886193275452, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.00670256931334734, "train/total_loss": 0.4777491092681885 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24419371783733368, "train/contrastive_loss": 1.9920066595077515, "train/negative_loss": 1.8763504028320312, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.1156562864780426, "train/total_loss": 0.6425950527191162 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.3122989237308502, "train/contrastive_loss": 2.5958714485168457, "train/negative_loss": 1.685879111289978, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.9099923372268677, "train/total_loss": 0.8314732313156128 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.20681218802928925, "train/contrastive_loss": 2.322512626647949, "train/negative_loss": 2.1041202545166016, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.2183922678232193, "train/total_loss": 0.6713147163391113 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2414204627275467, "train/contrastive_loss": 3.609355926513672, "train/negative_loss": 3.08012318611145, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5292326211929321, "train/total_loss": 0.9632916450500488 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2742444574832916, "train/contrastive_loss": 2.749952554702759, "train/negative_loss": 2.749920606613159, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 3.194859891664237e-05, "train/total_loss": 0.8242349624633789 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.21579399704933167, "train/contrastive_loss": 2.344604969024658, "train/negative_loss": 1.9381828308105469, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.40642213821411133, "train/total_loss": 0.6847150325775146 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2289884239435196, "train/contrastive_loss": 1.2784075736999512, "train/negative_loss": 1.1660082340240479, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.11239929497241974, "train/total_loss": 0.48466992378234863 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.26019981503486633, "train/contrastive_loss": 0.932488203048706, "train/negative_loss": 0.781326413154602, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.1511618047952652, "train/total_loss": 0.446697473526001 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23466898500919342, "train/contrastive_loss": 1.225492238998413, "train/negative_loss": 1.1051048040390015, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.12038746476173401, "train/total_loss": 0.47976744174957275 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.3182857632637024, "train/contrastive_loss": 2.451718330383301, "train/negative_loss": 2.353672504425049, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.09804584830999374, "train/total_loss": 0.8086293935775757 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.1761728674173355, "train/contrastive_loss": 1.9230961799621582, "train/negative_loss": 1.9159491062164307, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.007147099357098341, "train/total_loss": 0.560792088508606 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17623940110206604, "train/contrastive_loss": 0.9000499248504639, "train/negative_loss": 0.8372023105621338, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.06284762918949127, "train/total_loss": 0.3562493920326233 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.21636329591274261, "train/contrastive_loss": 1.6189684867858887, "train/negative_loss": 1.589046835899353, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.029921649023890495, "train/total_loss": 0.5401570200920105 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24555574357509613, "train/contrastive_loss": 2.163731098175049, "train/negative_loss": 1.5679959058761597, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.5957351326942444, "train/total_loss": 0.678301990032196 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24967283010482788, "train/contrastive_loss": 1.6834166049957275, "train/negative_loss": 1.6079005002975464, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.07551614940166473, "train/total_loss": 0.5863561630249023 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.18836277723312378, "train/contrastive_loss": 0.3667788505554199, "train/negative_loss": 0.35757413506507874, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.009204700589179993, "train/total_loss": 0.2617185413837433 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2358929067850113, "train/contrastive_loss": 2.9412269592285156, "train/negative_loss": 2.490908145904541, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.4503189027309418, "train/total_loss": 0.8241382837295532 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2816947102546692, "train/contrastive_loss": 4.933274269104004, "train/negative_loss": 2.0538012981414795, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 2.8794729709625244, "train/total_loss": 1.2683496475219727 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.17934270203113556, "train/contrastive_loss": 3.210433006286621, "train/negative_loss": 2.8731000423431396, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.33733296394348145, "train/total_loss": 0.8214293122291565 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.21843379735946655, "train/contrastive_loss": 0.5027125477790833, "train/negative_loss": 0.48300161957740784, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.019710931926965714, "train/total_loss": 0.3189763128757477 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.25661149621009827, "train/contrastive_loss": 1.5218721628189087, "train/negative_loss": 1.3274472951889038, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.1944248378276825, "train/total_loss": 0.5609859228134155 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.22328856587409973, "train/contrastive_loss": 4.805528163909912, "train/negative_loss": 4.8055100440979, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.8239355995319784e-05, "train/total_loss": 1.1843942403793335 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.23724225163459778, "train/contrastive_loss": 1.5536742210388184, "train/negative_loss": 1.1341301202774048, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.4195440411567688, "train/total_loss": 0.547977089881897 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2464766800403595, "train/contrastive_loss": 2.8333542346954346, "train/negative_loss": 2.789071559906006, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.044282764196395874, "train/total_loss": 0.8131475448608398 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.19211798906326294, "train/contrastive_loss": 3.807598829269409, "train/negative_loss": 2.323927402496338, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.4836714267730713, "train/total_loss": 0.9536377787590027 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2839981019496918, "train/contrastive_loss": 2.131500244140625, "train/negative_loss": 1.8393489122390747, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.29215145111083984, "train/total_loss": 0.7102981805801392 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.24952849745750427, "train/contrastive_loss": 1.4020882844924927, "train/negative_loss": 1.3898981809616089, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.012190134264528751, "train/total_loss": 0.5299461483955383 }, { "epoch": 3.873239436619718, "eval_exact_match_accuracy": 0.13580246913580246, "eval_hamming_loss": 0.08185496420790539, "eval_loss": 0.7055002450942993, "eval_macro_f1": 0.0969632603746814, "eval_macro_precision": 0.2131724484665661, "eval_macro_recall": 0.07356533001391038, "eval_micro_f1": 0.31569817866435385, "eval_micro_precision": 0.8465116279069768, "eval_micro_recall": 0.19402985074626866, "eval_runtime": 2.8482, "eval_samples_per_second": 199.076, "eval_steps_per_second": 24.928, "step": 1100 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.2119203507900238, "train/contrastive_loss": 0.9280003905296326, "train/negative_loss": 0.8303496241569519, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.09765076637268066, "train/total_loss": 0.39752042293548584 }, { "epoch": 3.873239436619718, "step": 1100, "train/classification_loss": 0.20301856100559235, "train/contrastive_loss": 1.0431458950042725, "train/negative_loss": 0.81928950548172, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.22385644912719727, "train/total_loss": 0.4116477370262146 }, { "epoch": 4.049295774647887, "grad_norm": 13.688472747802734, "learning_rate": 1.9852572233967583e-05, "loss": 0.9753, "step": 1150 }, { "epoch": 4.049295774647887, "step": 1150, "train/classification_loss": 0.35411015152931213, "train/contrastive_loss": 1.787449598312378, "train/negative_loss": 1.4512560367584229, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.33619359135627747, "train/total_loss": 0.7116000652313232 }, { "epoch": 4.049295774647887, "step": 1150, "train/classification_loss": 0.23314321041107178, "train/contrastive_loss": 0.7754062414169312, "train/negative_loss": 0.6427779793739319, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.13262827694416046, "train/total_loss": 0.3882244825363159 }, { "epoch": 4.225352112676056, "grad_norm": 20.463239669799805, "learning_rate": 1.984552501761804e-05, "loss": 0.9533, "step": 1200 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23820097744464874, "train/contrastive_loss": 2.2195143699645996, "train/negative_loss": 2.1864240169525146, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.033090438693761826, "train/total_loss": 0.6821038722991943 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.3126511871814728, "train/contrastive_loss": 1.3029661178588867, "train/negative_loss": 0.6426699757575989, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6602961421012878, "train/total_loss": 0.5732444524765015 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.26902809739112854, "train/contrastive_loss": 3.3653273582458496, "train/negative_loss": 2.093282461166382, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.2720450162887573, "train/total_loss": 0.9420936107635498 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.16100594401359558, "train/contrastive_loss": 1.5097841024398804, "train/negative_loss": 1.4639619588851929, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.04582216963171959, "train/total_loss": 0.4629627764225006 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23391561210155487, "train/contrastive_loss": 2.871906280517578, "train/negative_loss": 2.5959837436676025, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.2759224474430084, "train/total_loss": 0.8082969188690186 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23714615404605865, "train/contrastive_loss": 2.5147595405578613, "train/negative_loss": 1.66135573387146, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8534036874771118, "train/total_loss": 0.7400980591773987 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22908292710781097, "train/contrastive_loss": 2.4958722591400146, "train/negative_loss": 1.5669571161270142, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9289150834083557, "train/total_loss": 0.7282573580741882 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.24315716326236725, "train/contrastive_loss": 1.147068977355957, "train/negative_loss": 1.146935224533081, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.000133761772303842, "train/total_loss": 0.4725709557533264 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.16732251644134521, "train/contrastive_loss": 0.6897497773170471, "train/negative_loss": 0.4277394711971283, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2620103061199188, "train/total_loss": 0.3052724599838257 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.25074175000190735, "train/contrastive_loss": 2.818326711654663, "train/negative_loss": 1.9771109819412231, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8412157297134399, "train/total_loss": 0.8144071102142334 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.20019780099391937, "train/contrastive_loss": 2.1182432174682617, "train/negative_loss": 0.9785182476043701, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.139724850654602, "train/total_loss": 0.6238464713096619 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22391721606254578, "train/contrastive_loss": 1.2828621864318848, "train/negative_loss": 1.268310785293579, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.014551392756402493, "train/total_loss": 0.48048967123031616 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23621715605258942, "train/contrastive_loss": 3.8077096939086914, "train/negative_loss": 2.278451681137085, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.529257893562317, "train/total_loss": 0.9977591037750244 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2610945701599121, "train/contrastive_loss": 1.9956432580947876, "train/negative_loss": 1.9374083280563354, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.058234892785549164, "train/total_loss": 0.6602232456207275 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.16263200342655182, "train/contrastive_loss": 2.7147724628448486, "train/negative_loss": 0.9403889775276184, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.774383544921875, "train/total_loss": 0.7055864930152893 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22432219982147217, "train/contrastive_loss": 2.260737895965576, "train/negative_loss": 1.2054569721221924, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.0552810430526733, "train/total_loss": 0.6764698028564453 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.18923906981945038, "train/contrastive_loss": 1.4630100727081299, "train/negative_loss": 0.9888707399368286, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.47413939237594604, "train/total_loss": 0.4818410873413086 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22521206736564636, "train/contrastive_loss": 2.3338253498077393, "train/negative_loss": 2.046501636505127, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.28732380270957947, "train/total_loss": 0.6919771432876587 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22657722234725952, "train/contrastive_loss": 1.4559969902038574, "train/negative_loss": 0.9023036360740662, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.553693413734436, "train/total_loss": 0.517776608467102 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2026662528514862, "train/contrastive_loss": 3.5434229373931885, "train/negative_loss": 2.0275583267211914, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.515864610671997, "train/total_loss": 0.9113508462905884 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.1881251037120819, "train/contrastive_loss": 1.39735746383667, "train/negative_loss": 1.3268437385559082, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.07051370292901993, "train/total_loss": 0.4675965905189514 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.16246214509010315, "train/contrastive_loss": 2.396956443786621, "train/negative_loss": 1.8029283285140991, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.594028115272522, "train/total_loss": 0.6418534517288208 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22203607857227325, "train/contrastive_loss": 2.9253249168395996, "train/negative_loss": 1.178288221359253, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.7470366954803467, "train/total_loss": 0.8071010708808899 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2596926987171173, "train/contrastive_loss": 2.795374870300293, "train/negative_loss": 1.4317823648452759, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.3635923862457275, "train/total_loss": 0.8187676668167114 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21991199254989624, "train/contrastive_loss": 1.9777274131774902, "train/negative_loss": 1.2168290615081787, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.7608982920646667, "train/total_loss": 0.6154574751853943 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2313278615474701, "train/contrastive_loss": 2.268214702606201, "train/negative_loss": 1.3194770812988281, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.948737621307373, "train/total_loss": 0.6849707961082458 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2507913410663605, "train/contrastive_loss": 2.532198905944824, "train/negative_loss": 2.511834144592285, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.02036474645137787, "train/total_loss": 0.7572311162948608 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22977498173713684, "train/contrastive_loss": 0.4995616674423218, "train/negative_loss": 0.4863865375518799, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.013175136409699917, "train/total_loss": 0.32968732714653015 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2593741714954376, "train/contrastive_loss": 3.8490519523620605, "train/negative_loss": 2.156369686126709, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.692682147026062, "train/total_loss": 1.0291845798492432 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2559356689453125, "train/contrastive_loss": 0.7395895719528198, "train/negative_loss": 0.7330122590065002, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.006577320396900177, "train/total_loss": 0.4038535952568054 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.18498210608959198, "train/contrastive_loss": 1.246114730834961, "train/negative_loss": 1.2213551998138428, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.024759579449892044, "train/total_loss": 0.4342050552368164 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21050065755844116, "train/contrastive_loss": 3.0388805866241455, "train/negative_loss": 2.182076930999756, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8568036556243896, "train/total_loss": 0.8182767629623413 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21962806582450867, "train/contrastive_loss": 2.28347110748291, "train/negative_loss": 1.1052113771438599, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.1782597303390503, "train/total_loss": 0.6763222813606262 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2414647489786148, "train/contrastive_loss": 2.0475215911865234, "train/negative_loss": 1.9549386501312256, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.09258290380239487, "train/total_loss": 0.6509690880775452 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.26383158564567566, "train/contrastive_loss": 3.209746837615967, "train/negative_loss": 1.8684909343719482, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.3412559032440186, "train/total_loss": 0.9057809114456177 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.16165506839752197, "train/contrastive_loss": 1.9002012014389038, "train/negative_loss": 1.8871245384216309, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.013076669536530972, "train/total_loss": 0.5416953563690186 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2387543022632599, "train/contrastive_loss": 1.91302490234375, "train/negative_loss": 1.2365256547927856, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.6764992475509644, "train/total_loss": 0.6213592886924744 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2853037416934967, "train/contrastive_loss": 3.1011276245117188, "train/negative_loss": 3.092477560043335, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.00864995177835226, "train/total_loss": 0.905529260635376 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22179660201072693, "train/contrastive_loss": 0.533164381980896, "train/negative_loss": 0.5205826163291931, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0125817796215415, "train/total_loss": 0.3284294903278351 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.27831244468688965, "train/contrastive_loss": 5.48289680480957, "train/negative_loss": 3.590162754058838, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.8927342891693115, "train/total_loss": 1.3748918771743774 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.17007887363433838, "train/contrastive_loss": 0.6487374305725098, "train/negative_loss": 0.5470332503318787, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.1017041951417923, "train/total_loss": 0.29982638359069824 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.20303687453269958, "train/contrastive_loss": 2.851569652557373, "train/negative_loss": 1.6394004821777344, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.2121692895889282, "train/total_loss": 0.7733508348464966 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2422710806131363, "train/contrastive_loss": 1.0220674276351929, "train/negative_loss": 1.0196876525878906, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.002379767596721649, "train/total_loss": 0.4466845691204071 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.27504763007164, "train/contrastive_loss": 1.2418322563171387, "train/negative_loss": 1.2355135679244995, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.006318744271993637, "train/total_loss": 0.5234140753746033 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2379591315984726, "train/contrastive_loss": 1.6048810482025146, "train/negative_loss": 1.3263897895812988, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.2784913182258606, "train/total_loss": 0.5589353442192078 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.3087451159954071, "train/contrastive_loss": 3.5816688537597656, "train/negative_loss": 3.331193447113037, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.25047552585601807, "train/total_loss": 1.0250788927078247 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.19379587471485138, "train/contrastive_loss": 1.7554895877838135, "train/negative_loss": 1.3410553932189941, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.41443419456481934, "train/total_loss": 0.5448938012123108 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2315230667591095, "train/contrastive_loss": 2.369478225708008, "train/negative_loss": 1.7959967851638794, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.573481559753418, "train/total_loss": 0.7054187059402466 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2758389115333557, "train/contrastive_loss": 2.6423323154449463, "train/negative_loss": 2.6422619819641113, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 7.033595466054976e-05, "train/total_loss": 0.804305374622345 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21867045760154724, "train/contrastive_loss": 2.055758237838745, "train/negative_loss": 1.3003343343734741, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.755423903465271, "train/total_loss": 0.6298221349716187 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21739840507507324, "train/contrastive_loss": 1.3960161209106445, "train/negative_loss": 1.1293599605560303, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.26665621995925903, "train/total_loss": 0.4966016411781311 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.24844343960285187, "train/contrastive_loss": 0.8801074028015137, "train/negative_loss": 0.4586319029331207, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.42147552967071533, "train/total_loss": 0.4244649410247803 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23639611899852753, "train/contrastive_loss": 1.2823047637939453, "train/negative_loss": 0.7736068367958069, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5086979269981384, "train/total_loss": 0.49285709857940674 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.31819280982017517, "train/contrastive_loss": 2.318375825881958, "train/negative_loss": 1.9652572870254517, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.3531185984611511, "train/total_loss": 0.7818679809570312 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.1730251908302307, "train/contrastive_loss": 1.403673768043518, "train/negative_loss": 1.2460966110229492, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.15757720172405243, "train/total_loss": 0.45375993847846985 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.1673741340637207, "train/contrastive_loss": 1.0294147729873657, "train/negative_loss": 0.5770444273948669, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.4523703157901764, "train/total_loss": 0.3732571005821228 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2136966735124588, "train/contrastive_loss": 3.459001302719116, "train/negative_loss": 1.811866283416748, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.6471350193023682, "train/total_loss": 0.9054969549179077 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.230219304561615, "train/contrastive_loss": 2.9058241844177246, "train/negative_loss": 1.434438705444336, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.4713853597640991, "train/total_loss": 0.8113841414451599 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.24400371313095093, "train/contrastive_loss": 1.9538731575012207, "train/negative_loss": 1.9181960821151733, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.03567707538604736, "train/total_loss": 0.6347783803939819 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.180061936378479, "train/contrastive_loss": 0.370182603597641, "train/negative_loss": 0.34648385643959045, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.02369873598217964, "train/total_loss": 0.25409847497940063 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21889282763004303, "train/contrastive_loss": 2.6643178462982178, "train/negative_loss": 1.7027565240859985, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.961561381816864, "train/total_loss": 0.7517563700675964 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2903638184070587, "train/contrastive_loss": 2.4090704917907715, "train/negative_loss": 1.8289307355880737, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.5801397562026978, "train/total_loss": 0.7721779346466064 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.17654463648796082, "train/contrastive_loss": 2.6437220573425293, "train/negative_loss": 1.5578287839889526, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.0858933925628662, "train/total_loss": 0.7052890062332153 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2135140597820282, "train/contrastive_loss": 1.1043596267700195, "train/negative_loss": 0.9168818593025208, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.18747779726982117, "train/total_loss": 0.4343859851360321 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23641914129257202, "train/contrastive_loss": 1.5262194871902466, "train/negative_loss": 0.9449999928474426, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.581219494342804, "train/total_loss": 0.5416630506515503 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.21804450452327728, "train/contrastive_loss": 4.433368682861328, "train/negative_loss": 4.43336296081543, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 5.877047897229204e-06, "train/total_loss": 1.1047182083129883 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.22903616726398468, "train/contrastive_loss": 1.26973557472229, "train/negative_loss": 1.2510457038879395, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.018689824268221855, "train/total_loss": 0.4829832911491394 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2400054931640625, "train/contrastive_loss": 2.513589382171631, "train/negative_loss": 1.3694665431976318, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.144122838973999, "train/total_loss": 0.7427234053611755 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.18603594601154327, "train/contrastive_loss": 2.5822553634643555, "train/negative_loss": 1.6960792541503906, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8861759901046753, "train/total_loss": 0.7024869918823242 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.26890575885772705, "train/contrastive_loss": 2.616194725036621, "train/negative_loss": 2.1009938716888428, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5152009725570679, "train/total_loss": 0.7921447157859802 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.2412821352481842, "train/contrastive_loss": 1.127841830253601, "train/negative_loss": 0.8097090721130371, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.3181327283382416, "train/total_loss": 0.46685051918029785 }, { "epoch": 4.225352112676056, "eval_exact_match_accuracy": 0.18342151675485008, "eval_hamming_loss": 0.07666770411868451, "eval_loss": 0.655646026134491, "eval_macro_f1": 0.1646030455442915, "eval_macro_precision": 0.2693936266691685, "eval_macro_recall": 0.12418034188159713, "eval_micro_f1": 0.38365304420350294, "eval_micro_precision": 0.8812260536398467, "eval_micro_recall": 0.24520255863539445, "eval_runtime": 2.8396, "eval_samples_per_second": 199.678, "eval_steps_per_second": 25.004, "step": 1200 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.23825527727603912, "train/contrastive_loss": 2.3279671669006348, "train/negative_loss": 1.4855165481567383, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8424504995346069, "train/total_loss": 0.7038487195968628 }, { "epoch": 4.225352112676056, "step": 1200, "train/classification_loss": 0.1869194060564041, "train/contrastive_loss": 2.0423145294189453, "train/negative_loss": 1.075447916984558, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.9668665528297424, "train/total_loss": 0.5953823328018188 }, { "epoch": 4.401408450704225, "grad_norm": 14.286855697631836, "learning_rate": 1.98384778012685e-05, "loss": 0.9638, "step": 1250 }, { "epoch": 4.401408450704225, "step": 1250, "train/classification_loss": 0.19104373455047607, "train/contrastive_loss": 0.6243109703063965, "train/negative_loss": 0.6222519278526306, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0020590173080563545, "train/total_loss": 0.31590592861175537 }, { "epoch": 4.401408450704225, "step": 1250, "train/classification_loss": 0.20892855525016785, "train/contrastive_loss": 0.9095954895019531, "train/negative_loss": 0.4751937687397003, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4344017505645752, "train/total_loss": 0.39084765315055847 }, { "epoch": 4.577464788732394, "grad_norm": 14.127750396728516, "learning_rate": 1.9831430584918957e-05, "loss": 0.9747, "step": 1300 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23401476442813873, "train/contrastive_loss": 1.5566043853759766, "train/negative_loss": 1.1262366771697998, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.43036770820617676, "train/total_loss": 0.5453356504440308 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.3032030761241913, "train/contrastive_loss": 0.8808788657188416, "train/negative_loss": 0.7914912700653076, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.08938758075237274, "train/total_loss": 0.4793788492679596 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2706410884857178, "train/contrastive_loss": 3.123760938644409, "train/negative_loss": 1.550243854522705, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.573517084121704, "train/total_loss": 0.8953933119773865 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.15798883140087128, "train/contrastive_loss": 1.3137962818145752, "train/negative_loss": 0.822451114654541, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.49134519696235657, "train/total_loss": 0.42074811458587646 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22797857224941254, "train/contrastive_loss": 2.997321128845215, "train/negative_loss": 2.844057083129883, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.15326400101184845, "train/total_loss": 0.8274428248405457 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2316315919160843, "train/contrastive_loss": 2.246314525604248, "train/negative_loss": 1.2781991958618164, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.9681152701377869, "train/total_loss": 0.6808944940567017 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23319797217845917, "train/contrastive_loss": 1.6386709213256836, "train/negative_loss": 1.2055596113204956, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.4331112802028656, "train/total_loss": 0.5609321594238281 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23404213786125183, "train/contrastive_loss": 1.2143553495407104, "train/negative_loss": 1.2142421007156372, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00011325523519190028, "train/total_loss": 0.4769132137298584 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.15626783668994904, "train/contrastive_loss": 0.5440346002578735, "train/negative_loss": 0.45632341504096985, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.08771121501922607, "train/total_loss": 0.265074759721756 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.25827547907829285, "train/contrastive_loss": 3.0953986644744873, "train/negative_loss": 2.4372997283935547, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.6580989360809326, "train/total_loss": 0.8773552179336548 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.19195662438869476, "train/contrastive_loss": 1.2604176998138428, "train/negative_loss": 0.9611589312553406, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.2992587685585022, "train/total_loss": 0.4440401792526245 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.21832390129566193, "train/contrastive_loss": 2.0778255462646484, "train/negative_loss": 1.519291639328003, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.5585338473320007, "train/total_loss": 0.6338890194892883 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23998992145061493, "train/contrastive_loss": 3.333832263946533, "train/negative_loss": 1.804917335510254, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.5289148092269897, "train/total_loss": 0.9067564010620117 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2453434020280838, "train/contrastive_loss": 1.5505229234695435, "train/negative_loss": 1.1107038259506226, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.4398190975189209, "train/total_loss": 0.5554479956626892 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1536543369293213, "train/contrastive_loss": 1.608515977859497, "train/negative_loss": 0.882408618927002, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.7261072993278503, "train/total_loss": 0.4753575325012207 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2283710390329361, "train/contrastive_loss": 1.872093677520752, "train/negative_loss": 1.0226361751556396, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8494575023651123, "train/total_loss": 0.6027897596359253 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1807592660188675, "train/contrastive_loss": 1.440096378326416, "train/negative_loss": 0.8546149134635925, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5854814052581787, "train/total_loss": 0.4687785506248474 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23544827103614807, "train/contrastive_loss": 3.3001837730407715, "train/negative_loss": 2.247168779373169, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.0530149936676025, "train/total_loss": 0.8954850435256958 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2252124696969986, "train/contrastive_loss": 1.0233691930770874, "train/negative_loss": 0.8507015705108643, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.17266766726970673, "train/total_loss": 0.4298863112926483 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.19599266350269318, "train/contrastive_loss": 2.6318631172180176, "train/negative_loss": 1.7453365325927734, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8865267038345337, "train/total_loss": 0.7223652601242065 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1796572357416153, "train/contrastive_loss": 2.135979652404785, "train/negative_loss": 2.044992685317993, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.09098690003156662, "train/total_loss": 0.606853187084198 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.15876658260822296, "train/contrastive_loss": 2.268186092376709, "train/negative_loss": 1.7233991622924805, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5447870492935181, "train/total_loss": 0.6124038100242615 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22039884328842163, "train/contrastive_loss": 3.5753307342529297, "train/negative_loss": 1.9010919332504272, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.674238681793213, "train/total_loss": 0.9354649782180786 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.26601025462150574, "train/contrastive_loss": 3.0995233058929443, "train/negative_loss": 1.4762790203094482, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.623244285583496, "train/total_loss": 0.8859149217605591 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.20932075381278992, "train/contrastive_loss": 1.5616726875305176, "train/negative_loss": 0.7338090538978577, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.8278636932373047, "train/total_loss": 0.5216553211212158 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22062526643276215, "train/contrastive_loss": 3.1800804138183594, "train/negative_loss": 1.8454644680023193, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3346158266067505, "train/total_loss": 0.8566413521766663 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.24183550477027893, "train/contrastive_loss": 1.7665767669677734, "train/negative_loss": 1.6985372304916382, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.06803955137729645, "train/total_loss": 0.5951508283615112 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22191646695137024, "train/contrastive_loss": 0.7853184342384338, "train/negative_loss": 0.7448700666427612, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.04044835641980171, "train/total_loss": 0.3789801597595215 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2545104920864105, "train/contrastive_loss": 2.4410057067871094, "train/negative_loss": 1.145552158355713, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.295453667640686, "train/total_loss": 0.7427116632461548 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.253305584192276, "train/contrastive_loss": 0.8166927099227905, "train/negative_loss": 0.811310887336731, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.005381798837333918, "train/total_loss": 0.4166441261768341 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1783934235572815, "train/contrastive_loss": 1.362443447113037, "train/negative_loss": 1.3614118099212646, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0010316881816834211, "train/total_loss": 0.45088210701942444 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2097310572862625, "train/contrastive_loss": 2.6462390422821045, "train/negative_loss": 1.9738372564315796, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.6724017858505249, "train/total_loss": 0.7389788627624512 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.21386770904064178, "train/contrastive_loss": 1.8183174133300781, "train/negative_loss": 1.460629940032959, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.3576875329017639, "train/total_loss": 0.5775312185287476 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2335360199213028, "train/contrastive_loss": 1.8065866231918335, "train/negative_loss": 1.7047090530395508, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.10187755525112152, "train/total_loss": 0.5948533415794373 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2644630968570709, "train/contrastive_loss": 3.0111443996429443, "train/negative_loss": 1.7868986129760742, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.2242457866668701, "train/total_loss": 0.8666919469833374 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.15774653851985931, "train/contrastive_loss": 1.5923125743865967, "train/negative_loss": 1.5920966863632202, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.00021586695220321417, "train/total_loss": 0.47620904445648193 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22504517436027527, "train/contrastive_loss": 1.5546013116836548, "train/negative_loss": 1.1543443202972412, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.40025702118873596, "train/total_loss": 0.5359654426574707 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2818101644515991, "train/contrastive_loss": 2.370673894882202, "train/negative_loss": 2.32077956199646, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.049894239753484726, "train/total_loss": 0.7559449672698975 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.21561689674854279, "train/contrastive_loss": 0.12947344779968262, "train/negative_loss": 0.12818895280361176, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.0012845013989135623, "train/total_loss": 0.24151158332824707 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2862207293510437, "train/contrastive_loss": 4.021243095397949, "train/negative_loss": 2.4355289936065674, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.5857142210006714, "train/total_loss": 1.0904693603515625 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1605284959077835, "train/contrastive_loss": 0.9733806848526001, "train/negative_loss": 0.7981491088867188, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.17523156106472015, "train/total_loss": 0.35520464181900024 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2003738433122635, "train/contrastive_loss": 2.7260022163391113, "train/negative_loss": 1.368889570236206, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.3571126461029053, "train/total_loss": 0.7455742955207825 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23827454447746277, "train/contrastive_loss": 0.8021093010902405, "train/negative_loss": 0.8008567690849304, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0012525434140115976, "train/total_loss": 0.3986964225769043 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.26579779386520386, "train/contrastive_loss": 1.3488194942474365, "train/negative_loss": 1.3370717763900757, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.011747724376618862, "train/total_loss": 0.5355616807937622 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2275983840227127, "train/contrastive_loss": 1.4242030382156372, "train/negative_loss": 1.3714383840560913, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.052764710038900375, "train/total_loss": 0.5124390125274658 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.3079846203327179, "train/contrastive_loss": 3.3644702434539795, "train/negative_loss": 2.594789743423462, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.7696805000305176, "train/total_loss": 0.9808787107467651 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1919877976179123, "train/contrastive_loss": 2.4588255882263184, "train/negative_loss": 1.198575496673584, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.2602500915527344, "train/total_loss": 0.6837528944015503 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22943200170993805, "train/contrastive_loss": 2.4177746772766113, "train/negative_loss": 1.6359587907791138, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7818158268928528, "train/total_loss": 0.712986946105957 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.27851197123527527, "train/contrastive_loss": 2.978896141052246, "train/negative_loss": 2.9785914421081543, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.00030462612630799413, "train/total_loss": 0.874291181564331 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2117909938097, "train/contrastive_loss": 1.9047844409942627, "train/negative_loss": 1.1458433866500854, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.7589410543441772, "train/total_loss": 0.5927478671073914 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2072007805109024, "train/contrastive_loss": 0.7204608917236328, "train/negative_loss": 0.685080349445343, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.035380519926548004, "train/total_loss": 0.3512929677963257 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2516249418258667, "train/contrastive_loss": 1.2834277153015137, "train/negative_loss": 0.7897829413414001, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.4936448037624359, "train/total_loss": 0.5083104968070984 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2277771234512329, "train/contrastive_loss": 0.9544593095779419, "train/negative_loss": 0.6912152171134949, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.263244092464447, "train/total_loss": 0.4186689853668213 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.3175206780433655, "train/contrastive_loss": 2.5090723037719727, "train/negative_loss": 1.6274548768997192, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.881617546081543, "train/total_loss": 0.8193351626396179 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.16671912372112274, "train/contrastive_loss": 0.7467590570449829, "train/negative_loss": 0.6714926958084106, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.07526636123657227, "train/total_loss": 0.31607094407081604 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1625654250383377, "train/contrastive_loss": 0.42692652344703674, "train/negative_loss": 0.272882342338562, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.15404418110847473, "train/total_loss": 0.2479507327079773 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.1999031901359558, "train/contrastive_loss": 0.9797678589820862, "train/negative_loss": 0.9129236340522766, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.06684423238039017, "train/total_loss": 0.3958567678928375 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23402690887451172, "train/contrastive_loss": 3.5618300437927246, "train/negative_loss": 1.1926548480987549, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 2.3691751956939697, "train/total_loss": 0.9463929533958435 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2535379230976105, "train/contrastive_loss": 2.0842363834381104, "train/negative_loss": 1.8566031455993652, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.2276332825422287, "train/total_loss": 0.6703852415084839 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.17132024466991425, "train/contrastive_loss": 0.400510311126709, "train/negative_loss": 0.3717068135738373, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.02880351059138775, "train/total_loss": 0.25142231583595276 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2238728255033493, "train/contrastive_loss": 2.9969887733459473, "train/negative_loss": 1.5601463317871094, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.4368423223495483, "train/total_loss": 0.8232706189155579 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.28535664081573486, "train/contrastive_loss": 2.485658884048462, "train/negative_loss": 2.0277631282806396, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.45789575576782227, "train/total_loss": 0.7824884653091431 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.17268261313438416, "train/contrastive_loss": 1.8713536262512207, "train/negative_loss": 1.5168644189834595, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.354489266872406, "train/total_loss": 0.5469533205032349 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.21092760562896729, "train/contrastive_loss": 0.8458287715911865, "train/negative_loss": 0.7711238861083984, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.07470490038394928, "train/total_loss": 0.38009336590766907 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22525931894779205, "train/contrastive_loss": 1.6337599754333496, "train/negative_loss": 0.45575714111328125, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.1780028343200684, "train/total_loss": 0.5520113110542297 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.21781055629253387, "train/contrastive_loss": 4.552392959594727, "train/negative_loss": 4.552349090576172, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 4.367647852632217e-05, "train/total_loss": 1.1282891035079956 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.21694669127464294, "train/contrastive_loss": 0.8992151021957397, "train/negative_loss": 0.6574814319610596, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.24173367023468018, "train/total_loss": 0.3967897295951843 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.23654568195343018, "train/contrastive_loss": 1.8724230527877808, "train/negative_loss": 1.4034903049468994, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.46893274784088135, "train/total_loss": 0.6110303401947021 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.18248401582241058, "train/contrastive_loss": 2.415851593017578, "train/negative_loss": 1.0401480197906494, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.3757035732269287, "train/total_loss": 0.6656543612480164 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2719835340976715, "train/contrastive_loss": 2.2993414402008057, "train/negative_loss": 2.076965093612671, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.22237637639045715, "train/total_loss": 0.7318518161773682 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.2427232563495636, "train/contrastive_loss": 2.012882947921753, "train/negative_loss": 1.3373515605926514, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.6755313873291016, "train/total_loss": 0.6452998518943787 }, { "epoch": 4.577464788732394, "eval_exact_match_accuracy": 0.20105820105820105, "eval_hamming_loss": 0.07563025210084033, "eval_loss": 0.6144142746925354, "eval_macro_f1": 0.16896361025951567, "eval_macro_precision": 0.2716061903688679, "eval_macro_recall": 0.128501009843108, "eval_micro_f1": 0.4, "eval_micro_precision": 0.8772563176895307, "eval_micro_recall": 0.25906183368869934, "eval_runtime": 2.8436, "eval_samples_per_second": 199.398, "eval_steps_per_second": 24.969, "step": 1300 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.22063268721103668, "train/contrastive_loss": 0.9216023087501526, "train/negative_loss": 0.7635083198547363, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.15809400379657745, "train/total_loss": 0.40495315194129944 }, { "epoch": 4.577464788732394, "step": 1300, "train/classification_loss": 0.16536462306976318, "train/contrastive_loss": 0.5875394940376282, "train/negative_loss": 0.5407856702804565, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.04675380885601044, "train/total_loss": 0.2828725278377533 }, { "epoch": 4.753521126760563, "grad_norm": 14.944501876831055, "learning_rate": 1.982438336856942e-05, "loss": 0.9271, "step": 1350 }, { "epoch": 4.753521126760563, "step": 1350, "train/classification_loss": 0.21598052978515625, "train/contrastive_loss": 1.0731817483901978, "train/negative_loss": 1.0209242105484009, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.052257586270570755, "train/total_loss": 0.4306168854236603 }, { "epoch": 4.753521126760563, "step": 1350, "train/classification_loss": 0.23102152347564697, "train/contrastive_loss": 1.7591127157211304, "train/negative_loss": 1.6203545331954956, "train/num_negatives": 28, "train/num_positives": 20, "train/positive_loss": 0.13875816762447357, "train/total_loss": 0.582844078540802 }, { "epoch": 4.929577464788732, "grad_norm": 12.897309303283691, "learning_rate": 1.9817336152219873e-05, "loss": 0.9275, "step": 1400 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23393715918064117, "train/contrastive_loss": 1.4722117185592651, "train/negative_loss": 1.2722023725509644, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.2000093311071396, "train/total_loss": 0.528379499912262 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2999577224254608, "train/contrastive_loss": 1.2361167669296265, "train/negative_loss": 0.8706927299499512, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.3654240369796753, "train/total_loss": 0.5471810698509216 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.25975456833839417, "train/contrastive_loss": 2.3680732250213623, "train/negative_loss": 1.2489418983459473, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.119131326675415, "train/total_loss": 0.7333692312240601 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.15801315009593964, "train/contrastive_loss": 0.7145366072654724, "train/negative_loss": 0.6202155351638794, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.09432106465101242, "train/total_loss": 0.3009204864501953 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21140454709529877, "train/contrastive_loss": 2.6877408027648926, "train/negative_loss": 2.503927230834961, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.18381357192993164, "train/total_loss": 0.7489527463912964 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22213847935199738, "train/contrastive_loss": 2.550034999847412, "train/negative_loss": 1.4603843688964844, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.0896506309509277, "train/total_loss": 0.7321454882621765 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.20857639610767365, "train/contrastive_loss": 2.272698402404785, "train/negative_loss": 1.4846333265304565, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.7880651354789734, "train/total_loss": 0.6631160974502563 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22684897482395172, "train/contrastive_loss": 0.9840952754020691, "train/negative_loss": 0.9840511679649353, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 4.4108408474130556e-05, "train/total_loss": 0.4236680269241333 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.1542213410139084, "train/contrastive_loss": 0.6024507284164429, "train/negative_loss": 0.543899655342102, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.058551084250211716, "train/total_loss": 0.2747114896774292 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2476825714111328, "train/contrastive_loss": 3.0360355377197266, "train/negative_loss": 1.9377377033233643, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.0982978343963623, "train/total_loss": 0.8548896908760071 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.1866694837808609, "train/contrastive_loss": 1.3327810764312744, "train/negative_loss": 0.9623618125915527, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.3704192340373993, "train/total_loss": 0.4532257318496704 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21355567872524261, "train/contrastive_loss": 1.8908418416976929, "train/negative_loss": 1.8872884511947632, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.003553333692252636, "train/total_loss": 0.5917240381240845 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.24093280732631683, "train/contrastive_loss": 3.631753921508789, "train/negative_loss": 2.140901565551758, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.4908523559570312, "train/total_loss": 0.9672836065292358 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23973363637924194, "train/contrastive_loss": 1.4302055835723877, "train/negative_loss": 1.3044441938400269, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.12576135993003845, "train/total_loss": 0.5257747173309326 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.15119034051895142, "train/contrastive_loss": 2.565791368484497, "train/negative_loss": 0.7071977257728577, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.8585937023162842, "train/total_loss": 0.6643486022949219 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.20661590993404388, "train/contrastive_loss": 1.4633798599243164, "train/negative_loss": 0.785781979560852, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.6775978803634644, "train/total_loss": 0.49929189682006836 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.17302308976650238, "train/contrastive_loss": 1.5027965307235718, "train/negative_loss": 1.095802903175354, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4069935977458954, "train/total_loss": 0.47358238697052 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.20444808900356293, "train/contrastive_loss": 1.4097462892532349, "train/negative_loss": 1.1200119256973267, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.2897343337535858, "train/total_loss": 0.48639732599258423 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22217759490013123, "train/contrastive_loss": 1.3416063785552979, "train/negative_loss": 1.2977246046066284, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.04388182982802391, "train/total_loss": 0.4904988706111908 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.19605687260627747, "train/contrastive_loss": 3.1035685539245605, "train/negative_loss": 1.8977183103561401, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.20585036277771, "train/total_loss": 0.8167705535888672 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.17438937723636627, "train/contrastive_loss": 1.1631836891174316, "train/negative_loss": 1.144606351852417, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.018577340990304947, "train/total_loss": 0.40702611207962036 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.14891044795513153, "train/contrastive_loss": 1.7904173135757446, "train/negative_loss": 1.5921657085418701, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.1982516199350357, "train/total_loss": 0.5069938898086548 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2139759659767151, "train/contrastive_loss": 3.727570056915283, "train/negative_loss": 1.7804551124572754, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.9471148252487183, "train/total_loss": 0.9594900012016296 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2626914083957672, "train/contrastive_loss": 2.6890525817871094, "train/negative_loss": 1.2976715564727783, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.391381025314331, "train/total_loss": 0.8005019426345825 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.19910500943660736, "train/contrastive_loss": 1.7909460067749023, "train/negative_loss": 0.870284914970398, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.9206610918045044, "train/total_loss": 0.5572941899299622 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2213013619184494, "train/contrastive_loss": 3.4536094665527344, "train/negative_loss": 2.116147041320801, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3374624252319336, "train/total_loss": 0.9120233058929443 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23854103684425354, "train/contrastive_loss": 1.6801559925079346, "train/negative_loss": 1.675628423690796, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.004527554847300053, "train/total_loss": 0.5745722055435181 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21013152599334717, "train/contrastive_loss": 0.3212376534938812, "train/negative_loss": 0.3000991940498352, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.021138465031981468, "train/total_loss": 0.27437907457351685 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2551615238189697, "train/contrastive_loss": 2.024010181427002, "train/negative_loss": 0.9517756104469299, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0722346305847168, "train/total_loss": 0.6599636077880859 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.24212419986724854, "train/contrastive_loss": 0.7657091021537781, "train/negative_loss": 0.7523344159126282, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.013374675996601582, "train/total_loss": 0.39526602625846863 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.1769164353609085, "train/contrastive_loss": 1.89718496799469, "train/negative_loss": 1.8965978622436523, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0005871434696018696, "train/total_loss": 0.5563534498214722 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.20006434619426727, "train/contrastive_loss": 3.621943712234497, "train/negative_loss": 2.390413999557495, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.231529712677002, "train/total_loss": 0.9244531393051147 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21074402332305908, "train/contrastive_loss": 2.6736202239990234, "train/negative_loss": 1.5347355604171753, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.1388845443725586, "train/total_loss": 0.7454680800437927 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23172606527805328, "train/contrastive_loss": 1.8997231721878052, "train/negative_loss": 1.5308058261871338, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.368917316198349, "train/total_loss": 0.611670732498169 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.24845577776432037, "train/contrastive_loss": 1.744419813156128, "train/negative_loss": 1.3105539083480835, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.43386590480804443, "train/total_loss": 0.5973397493362427 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.16125430166721344, "train/contrastive_loss": 2.1428160667419434, "train/negative_loss": 1.9983477592468262, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.14446841180324554, "train/total_loss": 0.5898175239562988 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23195935785770416, "train/contrastive_loss": 1.6570932865142822, "train/negative_loss": 1.1011319160461426, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.5559613108634949, "train/total_loss": 0.5633780360221863 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.26865336298942566, "train/contrastive_loss": 3.343217611312866, "train/negative_loss": 2.9467906951904297, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3964269161224365, "train/total_loss": 0.9372968673706055 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21648384630680084, "train/contrastive_loss": 1.1829619407653809, "train/negative_loss": 0.5028421878814697, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.6801196932792664, "train/total_loss": 0.45307624340057373 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.28715255856513977, "train/contrastive_loss": 3.8815360069274902, "train/negative_loss": 1.99509596824646, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.8864400386810303, "train/total_loss": 1.0634597539901733 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.15984392166137695, "train/contrastive_loss": 1.2444604635238647, "train/negative_loss": 0.7440666556358337, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.500393807888031, "train/total_loss": 0.4087360203266144 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.1855562925338745, "train/contrastive_loss": 1.7380281686782837, "train/negative_loss": 1.3140361309051514, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.42399200797080994, "train/total_loss": 0.5331619381904602 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22104769945144653, "train/contrastive_loss": 1.1489006280899048, "train/negative_loss": 1.1484401226043701, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0004604670684784651, "train/total_loss": 0.45082783699035645 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2730380594730377, "train/contrastive_loss": 1.5600128173828125, "train/negative_loss": 1.4715052843093872, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.08850748836994171, "train/total_loss": 0.5850406289100647 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2212018519639969, "train/contrastive_loss": 1.9971472024917603, "train/negative_loss": 1.3740453720092773, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.6231018304824829, "train/total_loss": 0.6206312775611877 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2970312535762787, "train/contrastive_loss": 2.325863838195801, "train/negative_loss": 1.122704267501831, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.2031596899032593, "train/total_loss": 0.7622040510177612 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.19004490971565247, "train/contrastive_loss": 3.3516011238098145, "train/negative_loss": 1.4583089351654053, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.8932920694351196, "train/total_loss": 0.8603651523590088 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22262173891067505, "train/contrastive_loss": 2.6947569847106934, "train/negative_loss": 2.2964460849761963, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.39831095933914185, "train/total_loss": 0.7615731358528137 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2667829394340515, "train/contrastive_loss": 2.5166549682617188, "train/negative_loss": 2.516644239425659, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.0728893357736524e-05, "train/total_loss": 0.7701139450073242 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.20589295029640198, "train/contrastive_loss": 1.7858270406723022, "train/negative_loss": 1.328407883644104, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.45741915702819824, "train/total_loss": 0.5630583763122559 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.19719679653644562, "train/contrastive_loss": 0.6879628300666809, "train/negative_loss": 0.6219642758369446, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.06599855422973633, "train/total_loss": 0.33478936553001404 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23205526173114777, "train/contrastive_loss": 0.7114622592926025, "train/negative_loss": 0.5853481888771057, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.12611407041549683, "train/total_loss": 0.3743477165699005 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.23155814409255981, "train/contrastive_loss": 1.034451961517334, "train/negative_loss": 0.8554577231407166, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.17899425327777863, "train/total_loss": 0.43844854831695557 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.3008689880371094, "train/contrastive_loss": 1.319309115409851, "train/negative_loss": 1.1135939359664917, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.205715149641037, "train/total_loss": 0.5647308230400085 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.16647109389305115, "train/contrastive_loss": 0.9486055970191956, "train/negative_loss": 0.8614486455917358, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.08715693652629852, "train/total_loss": 0.3561922311782837 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.15506407618522644, "train/contrastive_loss": 0.5729125142097473, "train/negative_loss": 0.3452664017677307, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.2276460975408554, "train/total_loss": 0.2696465849876404 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.19409959018230438, "train/contrastive_loss": 0.7444077134132385, "train/negative_loss": 0.7230579853057861, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.02134970761835575, "train/total_loss": 0.34298112988471985 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22766001522541046, "train/contrastive_loss": 2.6191601753234863, "train/negative_loss": 1.266123652458191, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.3530365228652954, "train/total_loss": 0.7514920234680176 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22966733574867249, "train/contrastive_loss": 0.7468936443328857, "train/negative_loss": 0.6868898272514343, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.060003843158483505, "train/total_loss": 0.37904608249664307 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.16529713571071625, "train/contrastive_loss": 0.5958980321884155, "train/negative_loss": 0.37662050127983093, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.2192775458097458, "train/total_loss": 0.28447675704956055 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2148972749710083, "train/contrastive_loss": 2.1638331413269043, "train/negative_loss": 1.1603425741195679, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.003490686416626, "train/total_loss": 0.647663950920105 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.27717262506484985, "train/contrastive_loss": 1.8546534776687622, "train/negative_loss": 1.818279504776001, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.03637393191456795, "train/total_loss": 0.6481033563613892 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.1601891815662384, "train/contrastive_loss": 2.100324869155884, "train/negative_loss": 1.5401709079742432, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.5601539611816406, "train/total_loss": 0.5802541971206665 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2267373651266098, "train/contrastive_loss": 2.0910134315490723, "train/negative_loss": 1.3800240755081177, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.7109894752502441, "train/total_loss": 0.6449400782585144 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22092710435390472, "train/contrastive_loss": 1.2995631694793701, "train/negative_loss": 0.5123441815376282, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.7872190475463867, "train/total_loss": 0.48083972930908203 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21065887808799744, "train/contrastive_loss": 5.21412992477417, "train/negative_loss": 5.214123725891113, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 6.163147190818563e-06, "train/total_loss": 1.2534849643707275 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.209507018327713, "train/contrastive_loss": 1.1888965368270874, "train/negative_loss": 0.6046951413154602, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.5842013955116272, "train/total_loss": 0.44728630781173706 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.24194557964801788, "train/contrastive_loss": 2.0317795276641846, "train/negative_loss": 1.567382574081421, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4643968939781189, "train/total_loss": 0.6483014822006226 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.1839798092842102, "train/contrastive_loss": 3.1929068565368652, "train/negative_loss": 1.279168725013733, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.9137382507324219, "train/total_loss": 0.8225612044334412 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.2763615846633911, "train/contrastive_loss": 2.311007499694824, "train/negative_loss": 2.2773032188415527, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.033704303205013275, "train/total_loss": 0.738563060760498 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.21757225692272186, "train/contrastive_loss": 1.919898509979248, "train/negative_loss": 1.5635740756988525, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.35632437467575073, "train/total_loss": 0.6015519499778748 }, { "epoch": 4.929577464788732, "eval_exact_match_accuracy": 0.20634920634920634, "eval_hamming_loss": 0.0742815644776429, "eval_loss": 0.602698802947998, "eval_macro_f1": 0.18039899366294992, "eval_macro_precision": 0.26815441057420997, "eval_macro_recall": 0.1408294182448942, "eval_micro_f1": 0.42902711323763953, "eval_micro_precision": 0.8512658227848101, "eval_micro_recall": 0.2867803837953092, "eval_runtime": 2.8408, "eval_samples_per_second": 199.593, "eval_steps_per_second": 24.993, "step": 1400 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.22136974334716797, "train/contrastive_loss": 1.2682056427001953, "train/negative_loss": 1.1588491201400757, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.10935650765895844, "train/total_loss": 0.47501087188720703 }, { "epoch": 4.929577464788732, "step": 1400, "train/classification_loss": 0.19550098478794098, "train/contrastive_loss": 1.2021019458770752, "train/negative_loss": 1.0115691423416138, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.19053274393081665, "train/total_loss": 0.4359213709831238 }, { "epoch": 5.105633802816901, "grad_norm": 15.724308013916016, "learning_rate": 1.981028893587033e-05, "loss": 0.8954, "step": 1450 }, { "epoch": 5.105633802816901, "step": 1450, "train/classification_loss": 0.18994148075580597, "train/contrastive_loss": 1.1352885961532593, "train/negative_loss": 0.6845282912254333, "train/num_negatives": 32, "train/num_positives": 24, "train/positive_loss": 0.4507603347301483, "train/total_loss": 0.4169992208480835 }, { "epoch": 5.105633802816901, "step": 1450, "train/classification_loss": 0.22752925753593445, "train/contrastive_loss": 0.7950844764709473, "train/negative_loss": 0.7596084475517273, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.03547599911689758, "train/total_loss": 0.38654613494873047 }, { "epoch": 5.28169014084507, "grad_norm": 14.44680118560791, "learning_rate": 1.9803241719520793e-05, "loss": 0.8702, "step": 1500 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22636128962039948, "train/contrastive_loss": 2.0414843559265137, "train/negative_loss": 1.6787714958190918, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.3627128601074219, "train/total_loss": 0.63465815782547 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2975652515888214, "train/contrastive_loss": 0.7430849671363831, "train/negative_loss": 0.6191623210906982, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.12392264604568481, "train/total_loss": 0.4461822509765625 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.26759234070777893, "train/contrastive_loss": 2.839524269104004, "train/negative_loss": 1.739831566810608, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.0996925830841064, "train/total_loss": 0.835497260093689 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1427876055240631, "train/contrastive_loss": 0.6630963087081909, "train/negative_loss": 0.5745147466659546, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.08858159184455872, "train/total_loss": 0.2754068672657013 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21467840671539307, "train/contrastive_loss": 2.688988208770752, "train/negative_loss": 2.3859636783599854, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.3030245006084442, "train/total_loss": 0.7524760365486145 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2218104600906372, "train/contrastive_loss": 2.84360408782959, "train/negative_loss": 1.8320857286453247, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.0115182399749756, "train/total_loss": 0.7905312776565552 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22064198553562164, "train/contrastive_loss": 2.234194755554199, "train/negative_loss": 1.4630733728408813, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.7711214423179626, "train/total_loss": 0.6674809455871582 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.217738538980484, "train/contrastive_loss": 0.8700132966041565, "train/negative_loss": 0.8698275089263916, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00018580493633635342, "train/total_loss": 0.39174121618270874 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.13523893058300018, "train/contrastive_loss": 0.6919322609901428, "train/negative_loss": 0.4435657262802124, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.24836653470993042, "train/total_loss": 0.27362537384033203 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.24660545587539673, "train/contrastive_loss": 2.9734978675842285, "train/negative_loss": 1.8433940410614014, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.1301038265228271, "train/total_loss": 0.8413050174713135 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.18715506792068481, "train/contrastive_loss": 2.116032123565674, "train/negative_loss": 1.181221604347229, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.9348105192184448, "train/total_loss": 0.6103614568710327 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20544745028018951, "train/contrastive_loss": 1.607175588607788, "train/negative_loss": 1.1987271308898926, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.4084485173225403, "train/total_loss": 0.5268825888633728 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22728942334651947, "train/contrastive_loss": 3.931039810180664, "train/negative_loss": 2.4261186122894287, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.5049210786819458, "train/total_loss": 1.0134973526000977 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2303304374217987, "train/contrastive_loss": 1.6849133968353271, "train/negative_loss": 1.6026890277862549, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.08222441375255585, "train/total_loss": 0.5673131346702576 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1550561934709549, "train/contrastive_loss": 2.964245319366455, "train/negative_loss": 0.9514899253845215, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.0127553939819336, "train/total_loss": 0.7479052543640137 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2042667418718338, "train/contrastive_loss": 2.0260186195373535, "train/negative_loss": 1.2843199968338013, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.741698682308197, "train/total_loss": 0.6094704866409302 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.16754163801670074, "train/contrastive_loss": 1.4737792015075684, "train/negative_loss": 0.8898117542266846, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5839675068855286, "train/total_loss": 0.4622974991798401 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21145936846733093, "train/contrastive_loss": 1.7176973819732666, "train/negative_loss": 0.9128689765930176, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.8048284649848938, "train/total_loss": 0.5549988746643066 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20649760961532593, "train/contrastive_loss": 0.8787757158279419, "train/negative_loss": 0.3985722064971924, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.4802034795284271, "train/total_loss": 0.3822527527809143 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.19489778578281403, "train/contrastive_loss": 3.086888313293457, "train/negative_loss": 1.646887183189392, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.440001130104065, "train/total_loss": 0.8122754693031311 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.16930510103702545, "train/contrastive_loss": 1.041625738143921, "train/negative_loss": 0.9929075241088867, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.04871825501322746, "train/total_loss": 0.37763023376464844 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.14430966973304749, "train/contrastive_loss": 2.8742356300354004, "train/negative_loss": 1.8458573818206787, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0283783674240112, "train/total_loss": 0.7191568613052368 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.19273817539215088, "train/contrastive_loss": 2.236297369003296, "train/negative_loss": 1.3599917888641357, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.8763055801391602, "train/total_loss": 0.639997661113739 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.24937298893928528, "train/contrastive_loss": 2.778104066848755, "train/negative_loss": 1.426579236984253, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.351524829864502, "train/total_loss": 0.8049938678741455 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.18907541036605835, "train/contrastive_loss": 1.5253593921661377, "train/negative_loss": 0.7853926420211792, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.7399666905403137, "train/total_loss": 0.49414730072021484 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22384776175022125, "train/contrastive_loss": 3.009986162185669, "train/negative_loss": 1.789249300956726, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.2207368612289429, "train/total_loss": 0.8258450031280518 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2237471491098404, "train/contrastive_loss": 1.8612817525863647, "train/negative_loss": 1.8601264953613281, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0011552752694115043, "train/total_loss": 0.596003532409668 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20967324078083038, "train/contrastive_loss": 0.21053670346736908, "train/negative_loss": 0.19599571824073792, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.014540987089276314, "train/total_loss": 0.25178056955337524 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.25641560554504395, "train/contrastive_loss": 2.2025504112243652, "train/negative_loss": 1.0668914318084717, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.135659098625183, "train/total_loss": 0.696925699710846 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.23944158852100372, "train/contrastive_loss": 1.1535974740982056, "train/negative_loss": 1.1365643739700317, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.017033154144883156, "train/total_loss": 0.4701610803604126 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.16724729537963867, "train/contrastive_loss": 1.302540898323059, "train/negative_loss": 1.3008681535720825, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0016727934125810862, "train/total_loss": 0.4277554750442505 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1996653825044632, "train/contrastive_loss": 3.8614325523376465, "train/negative_loss": 2.305530548095703, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.5559020042419434, "train/total_loss": 0.9719519019126892 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21217036247253418, "train/contrastive_loss": 2.384697437286377, "train/negative_loss": 0.9175740480422974, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.4671235084533691, "train/total_loss": 0.6891098618507385 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2223367691040039, "train/contrastive_loss": 2.0807347297668457, "train/negative_loss": 1.5713911056518555, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.5093435645103455, "train/total_loss": 0.6384837627410889 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.25095394253730774, "train/contrastive_loss": 3.321063995361328, "train/negative_loss": 1.9911603927612305, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.329903483390808, "train/total_loss": 0.9151667356491089 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1524108201265335, "train/contrastive_loss": 2.1531994342803955, "train/negative_loss": 2.153045177459717, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.0001543389807920903, "train/total_loss": 0.5830507278442383 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21389931440353394, "train/contrastive_loss": 1.0181796550750732, "train/negative_loss": 0.6149943470954895, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.40318524837493896, "train/total_loss": 0.4175352454185486 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.27000924944877625, "train/contrastive_loss": 2.7042622566223145, "train/negative_loss": 2.2667722702026367, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.43748992681503296, "train/total_loss": 0.8108617067337036 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21009594202041626, "train/contrastive_loss": 0.4851546883583069, "train/negative_loss": 0.38059118390083313, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.10456349700689316, "train/total_loss": 0.30712687969207764 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2787434160709381, "train/contrastive_loss": 3.513895034790039, "train/negative_loss": 2.2333409786224365, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.280554175376892, "train/total_loss": 0.9815224409103394 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.15372511744499207, "train/contrastive_loss": 1.4948574304580688, "train/negative_loss": 0.8530688285827637, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.6417886018753052, "train/total_loss": 0.45269662141799927 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1950065940618515, "train/contrastive_loss": 3.4712212085723877, "train/negative_loss": 2.2971549034118652, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.1740663051605225, "train/total_loss": 0.8892508745193481 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21279451251029968, "train/contrastive_loss": 1.0096569061279297, "train/negative_loss": 1.0092675685882568, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0003893813118338585, "train/total_loss": 0.4147258996963501 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2675437331199646, "train/contrastive_loss": 1.8837124109268188, "train/negative_loss": 1.8820476531982422, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0016647394513711333, "train/total_loss": 0.6442862153053284 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21745339035987854, "train/contrastive_loss": 0.950171172618866, "train/negative_loss": 0.6876944899559021, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.26247668266296387, "train/total_loss": 0.4074876308441162 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.3117443025112152, "train/contrastive_loss": 2.8014614582061768, "train/negative_loss": 2.127279043197632, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.6741823554039001, "train/total_loss": 0.8720365762710571 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.17777502536773682, "train/contrastive_loss": 1.4357764720916748, "train/negative_loss": 1.0680173635482788, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.36775916814804077, "train/total_loss": 0.46493032574653625 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22267363965511322, "train/contrastive_loss": 2.5921692848205566, "train/negative_loss": 1.7946677207946777, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7975016236305237, "train/total_loss": 0.7411075234413147 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2684362232685089, "train/contrastive_loss": 2.321204900741577, "train/negative_loss": 2.321115493774414, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 8.929174509830773e-05, "train/total_loss": 0.7326772212982178 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.19712282717227936, "train/contrastive_loss": 2.233785390853882, "train/negative_loss": 1.603864312171936, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.629921019077301, "train/total_loss": 0.6438798904418945 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1858803778886795, "train/contrastive_loss": 0.6894663572311401, "train/negative_loss": 0.44342461228370667, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.24604175984859467, "train/total_loss": 0.32377365231513977 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.24126358330249786, "train/contrastive_loss": 0.5397908091545105, "train/negative_loss": 0.47343602776527405, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.06635475903749466, "train/total_loss": 0.34922173619270325 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22538423538208008, "train/contrastive_loss": 1.0500423908233643, "train/negative_loss": 0.770239531993866, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.2798028886318207, "train/total_loss": 0.43539273738861084 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.3079920709133148, "train/contrastive_loss": 1.9762444496154785, "train/negative_loss": 1.3747068643569946, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.6015375256538391, "train/total_loss": 0.7032409906387329 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1529608517885208, "train/contrastive_loss": 0.5382075905799866, "train/negative_loss": 0.5331097841262817, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.005097777582705021, "train/total_loss": 0.26060235500335693 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1508939117193222, "train/contrastive_loss": 0.7440985441207886, "train/negative_loss": 0.2530116140842438, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.4910869300365448, "train/total_loss": 0.2997136116027832 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.1866835653781891, "train/contrastive_loss": 0.9746546745300293, "train/negative_loss": 0.906044602394104, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.0686100572347641, "train/total_loss": 0.3816145062446594 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2201661467552185, "train/contrastive_loss": 2.9372711181640625, "train/negative_loss": 1.0342472791671753, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.9030237197875977, "train/total_loss": 0.8076204061508179 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22550223767757416, "train/contrastive_loss": 1.3420944213867188, "train/negative_loss": 1.223663568496704, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.11843083798885345, "train/total_loss": 0.49392110109329224 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.15391422808170319, "train/contrastive_loss": 0.3427361845970154, "train/negative_loss": 0.18869996070861816, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.15403620898723602, "train/total_loss": 0.22246146202087402 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20097817480564117, "train/contrastive_loss": 2.4801955223083496, "train/negative_loss": 1.040342926979065, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.4398527145385742, "train/total_loss": 0.6970173120498657 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2750329375267029, "train/contrastive_loss": 2.6431326866149902, "train/negative_loss": 2.556562662124634, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.0865701362490654, "train/total_loss": 0.8036594986915588 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.16166841983795166, "train/contrastive_loss": 3.3219175338745117, "train/negative_loss": 1.5956919193267822, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.726225733757019, "train/total_loss": 0.8260519504547119 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.22442971169948578, "train/contrastive_loss": 1.8916311264038086, "train/negative_loss": 1.7948410511016846, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.09679010510444641, "train/total_loss": 0.6027559638023376 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21694506704807281, "train/contrastive_loss": 1.2165296077728271, "train/negative_loss": 0.7232502102851868, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.4932793378829956, "train/total_loss": 0.46025097370147705 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20899632573127747, "train/contrastive_loss": 5.260756969451904, "train/negative_loss": 5.260749816894531, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 7.224129603855545e-06, "train/total_loss": 1.2611477375030518 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20686830580234528, "train/contrastive_loss": 0.7166347503662109, "train/negative_loss": 0.3884955048561096, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.3281392753124237, "train/total_loss": 0.3501952588558197 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.2344495803117752, "train/contrastive_loss": 2.4842820167541504, "train/negative_loss": 1.4722728729248047, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0120090246200562, "train/total_loss": 0.7313060164451599 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.17630720138549805, "train/contrastive_loss": 2.585228204727173, "train/negative_loss": 1.4172074794769287, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.1680207252502441, "train/total_loss": 0.6933528780937195 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.26748135685920715, "train/contrastive_loss": 2.0368354320526123, "train/negative_loss": 1.9325711727142334, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.1042642742395401, "train/total_loss": 0.6748484373092651 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.20691922307014465, "train/contrastive_loss": 0.979591429233551, "train/negative_loss": 0.8532407879829407, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.12635065615177155, "train/total_loss": 0.40283751487731934 }, { "epoch": 5.28169014084507, "eval_exact_match_accuracy": 0.2239858906525573, "eval_hamming_loss": 0.07262164124909223, "eval_loss": 0.6040080785751343, "eval_macro_f1": 0.19772493885278988, "eval_macro_precision": 0.3197474920333325, "eval_macro_recall": 0.15588829677088895, "eval_micro_f1": 0.45054945054945056, "eval_micro_precision": 0.8541666666666666, "eval_micro_recall": 0.30597014925373134, "eval_runtime": 2.8406, "eval_samples_per_second": 199.605, "eval_steps_per_second": 24.995, "step": 1500 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21017411351203918, "train/contrastive_loss": 1.1640411615371704, "train/negative_loss": 0.8045998811721802, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.35944128036499023, "train/total_loss": 0.44298234581947327 }, { "epoch": 5.28169014084507, "step": 1500, "train/classification_loss": 0.21734820306301117, "train/contrastive_loss": 0.6913052201271057, "train/negative_loss": 0.6011077761650085, "train/num_negatives": 36, "train/num_positives": 16, "train/positive_loss": 0.09019742906093597, "train/total_loss": 0.3556092381477356 }, { "epoch": 5.457746478873239, "grad_norm": 11.561055183410645, "learning_rate": 1.9796194503171248e-05, "loss": 0.8382, "step": 1550 }, { "epoch": 5.457746478873239, "step": 1550, "train/classification_loss": 0.22216124832630157, "train/contrastive_loss": 1.2040032148361206, "train/negative_loss": 0.7773630023002625, "train/num_negatives": 24, "train/num_positives": 18, "train/positive_loss": 0.42664018273353577, "train/total_loss": 0.46296191215515137 }, { "epoch": 5.457746478873239, "step": 1550, "train/classification_loss": 0.25321558117866516, "train/contrastive_loss": 1.0504286289215088, "train/negative_loss": 0.7849107980728149, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.2655177712440491, "train/total_loss": 0.46330130100250244 }, { "epoch": 5.633802816901408, "grad_norm": 16.24932861328125, "learning_rate": 1.9789147286821706e-05, "loss": 0.8582, "step": 1600 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.23702077567577362, "train/contrastive_loss": 1.6451088190078735, "train/negative_loss": 1.5508790016174316, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.09422986209392548, "train/total_loss": 0.5660425424575806 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2807944416999817, "train/contrastive_loss": 1.4290659427642822, "train/negative_loss": 0.5341874361038208, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.8948785662651062, "train/total_loss": 0.5666075944900513 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2671695053577423, "train/contrastive_loss": 2.3894972801208496, "train/negative_loss": 1.2943984270095825, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.0950989723205566, "train/total_loss": 0.7450689673423767 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.13481146097183228, "train/contrastive_loss": 0.5420774221420288, "train/negative_loss": 0.48649072647094727, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.055586669594049454, "train/total_loss": 0.24322694540023804 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.21328222751617432, "train/contrastive_loss": 2.6036579608917236, "train/negative_loss": 2.0069971084594727, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.596660852432251, "train/total_loss": 0.7340138554573059 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.21861054003238678, "train/contrastive_loss": 2.874683141708374, "train/negative_loss": 1.37449312210083, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.500190019607544, "train/total_loss": 0.7935471534729004 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2072199136018753, "train/contrastive_loss": 2.2234437465667725, "train/negative_loss": 1.3584762811660767, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.864967405796051, "train/total_loss": 0.6519086956977844 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2144571840763092, "train/contrastive_loss": 0.7091529369354248, "train/negative_loss": 0.7090263366699219, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00012660828360822052, "train/total_loss": 0.35628777742385864 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.1336527317762375, "train/contrastive_loss": 1.205674409866333, "train/negative_loss": 0.4180910587310791, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.7875833511352539, "train/total_loss": 0.3747876286506653 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22610506415367126, "train/contrastive_loss": 3.4279775619506836, "train/negative_loss": 1.413112998008728, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 2.014864683151245, "train/total_loss": 0.9117006063461304 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.1818275898694992, "train/contrastive_loss": 2.3474843502044678, "train/negative_loss": 1.0960769653320312, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.2514073848724365, "train/total_loss": 0.651324450969696 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19788329303264618, "train/contrastive_loss": 0.7274901866912842, "train/negative_loss": 0.726530909538269, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0009592588758096099, "train/total_loss": 0.3433813452720642 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22228887677192688, "train/contrastive_loss": 3.467336654663086, "train/negative_loss": 2.3886945247650146, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0786421298980713, "train/total_loss": 0.9157562255859375 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22804833948612213, "train/contrastive_loss": 1.145745038986206, "train/negative_loss": 1.0951086282730103, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.0506364107131958, "train/total_loss": 0.457197368144989 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.15663203597068787, "train/contrastive_loss": 3.1898193359375, "train/negative_loss": 0.8811120390892029, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.3087072372436523, "train/total_loss": 0.7945959568023682 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20080019533634186, "train/contrastive_loss": 2.1944327354431152, "train/negative_loss": 1.15549635887146, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.0389363765716553, "train/total_loss": 0.6396867632865906 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.16196012496948242, "train/contrastive_loss": 1.927802324295044, "train/negative_loss": 1.0773741006851196, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.8504282236099243, "train/total_loss": 0.547520637512207 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20059916377067566, "train/contrastive_loss": 1.8498501777648926, "train/negative_loss": 1.4267992973327637, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.4230509400367737, "train/total_loss": 0.5705692172050476 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19621223211288452, "train/contrastive_loss": 0.8714191913604736, "train/negative_loss": 0.5153063535690308, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.3561128079891205, "train/total_loss": 0.37049609422683716 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19108864665031433, "train/contrastive_loss": 2.732180595397949, "train/negative_loss": 1.5897300243377686, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1424506902694702, "train/total_loss": 0.7375247478485107 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.16884231567382812, "train/contrastive_loss": 0.8711749911308289, "train/negative_loss": 0.8151357769966125, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.05603921413421631, "train/total_loss": 0.34307730197906494 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.14346754550933838, "train/contrastive_loss": 3.257957696914673, "train/negative_loss": 2.0725789070129395, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1853787899017334, "train/total_loss": 0.795059084892273 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.18945926427841187, "train/contrastive_loss": 2.7343173027038574, "train/negative_loss": 0.8981912136077881, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.8361260890960693, "train/total_loss": 0.7363227605819702 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.24139651656150818, "train/contrastive_loss": 2.6334381103515625, "train/negative_loss": 1.2412890195846558, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.3921489715576172, "train/total_loss": 0.7680841684341431 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19805581867694855, "train/contrastive_loss": 2.717120885848999, "train/negative_loss": 0.8351744413375854, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.8819464445114136, "train/total_loss": 0.7414799928665161 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22040274739265442, "train/contrastive_loss": 2.877885580062866, "train/negative_loss": 2.0133190155029297, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8645665645599365, "train/total_loss": 0.7959798574447632 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.21370400488376617, "train/contrastive_loss": 1.2733008861541748, "train/negative_loss": 1.272513508796692, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0007874318398535252, "train/total_loss": 0.4683641791343689 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20344698429107666, "train/contrastive_loss": 0.1555728167295456, "train/negative_loss": 0.143561452627182, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.01201136689633131, "train/total_loss": 0.23456154763698578 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.25167909264564514, "train/contrastive_loss": 3.0801098346710205, "train/negative_loss": 1.464032769203186, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.6160770654678345, "train/total_loss": 0.8677010536193848 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22584731876850128, "train/contrastive_loss": 0.5820425152778625, "train/negative_loss": 0.4849640727043152, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.09707845747470856, "train/total_loss": 0.3422558307647705 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.165061816573143, "train/contrastive_loss": 0.9276313781738281, "train/negative_loss": 0.9270414113998413, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0005899504176340997, "train/total_loss": 0.3505880832672119 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19334378838539124, "train/contrastive_loss": 3.6510744094848633, "train/negative_loss": 1.8619177341461182, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.7891566753387451, "train/total_loss": 0.9235587120056152 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2063838392496109, "train/contrastive_loss": 2.273486614227295, "train/negative_loss": 1.0990484952926636, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.174438238143921, "train/total_loss": 0.6610811948776245 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22358667850494385, "train/contrastive_loss": 1.647292137145996, "train/negative_loss": 1.556389570236206, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.09090255945920944, "train/total_loss": 0.5530451536178589 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.24036137759685516, "train/contrastive_loss": 2.812830924987793, "train/negative_loss": 1.8549643754959106, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.9578665494918823, "train/total_loss": 0.8029276132583618 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.15133407711982727, "train/contrastive_loss": 1.9341228008270264, "train/negative_loss": 1.9336551427841187, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.0004676328389905393, "train/total_loss": 0.538158655166626 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2138678878545761, "train/contrastive_loss": 0.9629563093185425, "train/negative_loss": 0.45816758275032043, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.5047887563705444, "train/total_loss": 0.40645915269851685 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2579900622367859, "train/contrastive_loss": 4.260730266571045, "train/negative_loss": 4.012881755828857, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.24784834682941437, "train/total_loss": 1.1101361513137817 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2206651121377945, "train/contrastive_loss": 1.5702457427978516, "train/negative_loss": 0.9921298623085022, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.5781158804893494, "train/total_loss": 0.5347142815589905 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2739638388156891, "train/contrastive_loss": 3.6081268787384033, "train/negative_loss": 2.3873746395111084, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.220752239227295, "train/total_loss": 0.9955892562866211 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.1533750593662262, "train/contrastive_loss": 1.613090991973877, "train/negative_loss": 0.8586022257804871, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.7544887065887451, "train/total_loss": 0.475993275642395 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20242871344089508, "train/contrastive_loss": 3.991438150405884, "train/negative_loss": 2.162257194519043, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.8291809558868408, "train/total_loss": 1.0007163286209106 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20762135088443756, "train/contrastive_loss": 1.1606533527374268, "train/negative_loss": 1.1593447923660278, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0013085369719192386, "train/total_loss": 0.4397520422935486 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2719421088695526, "train/contrastive_loss": 1.808800220489502, "train/negative_loss": 1.7140024900436401, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.09479769319295883, "train/total_loss": 0.6337021589279175 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20392394065856934, "train/contrastive_loss": 0.8441608548164368, "train/negative_loss": 0.6126073002815247, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.2315535545349121, "train/total_loss": 0.37275612354278564 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.3177470862865448, "train/contrastive_loss": 3.02396559715271, "train/negative_loss": 2.4306905269622803, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.5932750105857849, "train/total_loss": 0.9225401878356934 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.17588309943675995, "train/contrastive_loss": 1.8991339206695557, "train/negative_loss": 0.9913210272789001, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9078129529953003, "train/total_loss": 0.5557098984718323 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.21649636328220367, "train/contrastive_loss": 2.3409266471862793, "train/negative_loss": 2.0015835762023926, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.33934295177459717, "train/total_loss": 0.6846817135810852 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2586718797683716, "train/contrastive_loss": 2.231245517730713, "train/negative_loss": 2.2312281131744385, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.7404707250534557e-05, "train/total_loss": 0.7049210071563721 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.2034951001405716, "train/contrastive_loss": 2.8478569984436035, "train/negative_loss": 1.6936752796173096, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.1541815996170044, "train/total_loss": 0.773066520690918 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.18201115727424622, "train/contrastive_loss": 1.479737639427185, "train/negative_loss": 0.9148036241531372, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.5649340152740479, "train/total_loss": 0.47795867919921875 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22470872104167938, "train/contrastive_loss": 0.9826817512512207, "train/negative_loss": 0.7071917057037354, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.27549004554748535, "train/total_loss": 0.4212450683116913 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22552569210529327, "train/contrastive_loss": 1.206992506980896, "train/negative_loss": 0.7897206544876099, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.4172718822956085, "train/total_loss": 0.46692419052124023 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.3138810694217682, "train/contrastive_loss": 2.2114133834838867, "train/negative_loss": 1.7286598682403564, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.4827536344528198, "train/total_loss": 0.7561637163162231 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.1525324434041977, "train/contrastive_loss": 0.8160380125045776, "train/negative_loss": 0.6123915910720825, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.20364642143249512, "train/total_loss": 0.31574004888534546 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.15518178045749664, "train/contrastive_loss": 0.9236260652542114, "train/negative_loss": 0.33020737767219543, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.5934186577796936, "train/total_loss": 0.3399069905281067 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.18703415989875793, "train/contrastive_loss": 0.9746322631835938, "train/negative_loss": 0.7493367195129395, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.22529557347297668, "train/total_loss": 0.3819606304168701 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20868200063705444, "train/contrastive_loss": 2.178956985473633, "train/negative_loss": 1.1348897218704224, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.044067144393921, "train/total_loss": 0.6444734334945679 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22476527094841003, "train/contrastive_loss": 1.185799241065979, "train/negative_loss": 0.9723201394081116, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.21347910165786743, "train/total_loss": 0.46192511916160583 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.1576899141073227, "train/contrastive_loss": 0.6182948350906372, "train/negative_loss": 0.3953501880168915, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.22294463217258453, "train/total_loss": 0.2813488841056824 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19558343291282654, "train/contrastive_loss": 1.8985164165496826, "train/negative_loss": 0.9347307085990906, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.9637857675552368, "train/total_loss": 0.5752867460250854 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.27345722913742065, "train/contrastive_loss": 2.0676190853118896, "train/negative_loss": 2.062793254852295, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.004825713578611612, "train/total_loss": 0.6869810819625854 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.15852481126785278, "train/contrastive_loss": 2.91733980178833, "train/negative_loss": 1.1113064289093018, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.8060334920883179, "train/total_loss": 0.7419927716255188 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.21702103316783905, "train/contrastive_loss": 1.9533376693725586, "train/negative_loss": 1.8773987293243408, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.07593892514705658, "train/total_loss": 0.6076885461807251 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20359709858894348, "train/contrastive_loss": 2.540095806121826, "train/negative_loss": 0.6672948598861694, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.8728008270263672, "train/total_loss": 0.7116162776947021 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20051588118076324, "train/contrastive_loss": 4.684122085571289, "train/negative_loss": 4.684116363525391, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 5.686307304131333e-06, "train/total_loss": 1.1373403072357178 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20230109989643097, "train/contrastive_loss": 0.7998157739639282, "train/negative_loss": 0.5881301164627075, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.2116856873035431, "train/total_loss": 0.3622642755508423 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.22185884416103363, "train/contrastive_loss": 2.8162074089050293, "train/negative_loss": 1.118725061416626, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.6974823474884033, "train/total_loss": 0.7851003408432007 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.17553521692752838, "train/contrastive_loss": 2.298393487930298, "train/negative_loss": 1.1296616792678833, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.1687318086624146, "train/total_loss": 0.6352139115333557 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.25741371512413025, "train/contrastive_loss": 1.8554365634918213, "train/negative_loss": 1.36845064163208, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.4869858920574188, "train/total_loss": 0.6285010576248169 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.1986110359430313, "train/contrastive_loss": 0.9597651958465576, "train/negative_loss": 0.6958547830581665, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.2639104127883911, "train/total_loss": 0.39056408405303955 }, { "epoch": 5.633802816901408, "eval_exact_match_accuracy": 0.2292768959435626, "eval_hamming_loss": 0.07293287685444548, "eval_loss": 0.6104494333267212, "eval_macro_f1": 0.21772971254811033, "eval_macro_precision": 0.3684285285076008, "eval_macro_recall": 0.1696943358517272, "eval_micro_f1": 0.45120999219359875, "eval_micro_precision": 0.8425655976676385, "eval_micro_recall": 0.30810234541577824, "eval_runtime": 2.8442, "eval_samples_per_second": 199.356, "eval_steps_per_second": 24.963, "step": 1600 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.19540128111839294, "train/contrastive_loss": 1.2757567167282104, "train/negative_loss": 1.1663979291915894, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.1093587651848793, "train/total_loss": 0.45055264234542847 }, { "epoch": 5.633802816901408, "step": 1600, "train/classification_loss": 0.20016218721866608, "train/contrastive_loss": 1.5143775939941406, "train/negative_loss": 1.4740484952926636, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.040329139679670334, "train/total_loss": 0.503037691116333 }, { "epoch": 5.809859154929578, "grad_norm": 12.960160255432129, "learning_rate": 1.9782100070472167e-05, "loss": 0.9118, "step": 1650 }, { "epoch": 5.809859154929578, "step": 1650, "train/classification_loss": 0.19248813390731812, "train/contrastive_loss": 0.9245613217353821, "train/negative_loss": 0.8709220886230469, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.05363922193646431, "train/total_loss": 0.37740039825439453 }, { "epoch": 5.809859154929578, "step": 1650, "train/classification_loss": 0.20316040515899658, "train/contrastive_loss": 1.0644290447235107, "train/negative_loss": 0.5469610095024109, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5174680352210999, "train/total_loss": 0.4160462021827698 }, { "epoch": 5.985915492957746, "grad_norm": 12.231520652770996, "learning_rate": 1.977505285412262e-05, "loss": 0.8783, "step": 1700 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.221462219953537, "train/contrastive_loss": 2.4590988159179688, "train/negative_loss": 1.7600843906402588, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.6990143656730652, "train/total_loss": 0.7132819890975952 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.26578959822654724, "train/contrastive_loss": 1.0746912956237793, "train/negative_loss": 0.6682382225990295, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.40645313262939453, "train/total_loss": 0.4807278513908386 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.26474907994270325, "train/contrastive_loss": 3.065286636352539, "train/negative_loss": 1.94959557056427, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.115691065788269, "train/total_loss": 0.8778064250946045 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.14364959299564362, "train/contrastive_loss": 0.9807185530662537, "train/negative_loss": 0.8213047981262207, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.15941375494003296, "train/total_loss": 0.33979332447052 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2084214836359024, "train/contrastive_loss": 2.3200767040252686, "train/negative_loss": 2.0234482288360596, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.296628475189209, "train/total_loss": 0.6724368333816528 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2177915722131729, "train/contrastive_loss": 2.948605537414551, "train/negative_loss": 1.6253365278244019, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.3232691287994385, "train/total_loss": 0.8075127005577087 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21262404322624207, "train/contrastive_loss": 2.0823614597320557, "train/negative_loss": 1.1420468091964722, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9403145909309387, "train/total_loss": 0.6290963292121887 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21171583235263824, "train/contrastive_loss": 1.133407711982727, "train/negative_loss": 1.132680892944336, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0007267850451171398, "train/total_loss": 0.4383973777294159 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.13563896715641022, "train/contrastive_loss": 0.6403701305389404, "train/negative_loss": 0.40667724609375, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.23369285464286804, "train/total_loss": 0.263713002204895 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2288937270641327, "train/contrastive_loss": 2.151214599609375, "train/negative_loss": 0.9454410076141357, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.2057735919952393, "train/total_loss": 0.6591366529464722 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.17437100410461426, "train/contrastive_loss": 1.8770527839660645, "train/negative_loss": 0.830203115940094, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.0468497276306152, "train/total_loss": 0.5497815608978271 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19360946118831635, "train/contrastive_loss": 1.2126843929290771, "train/negative_loss": 1.2080878019332886, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.00459654163569212, "train/total_loss": 0.4361463487148285 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21134503185749054, "train/contrastive_loss": 3.1952462196350098, "train/negative_loss": 1.8184351921081543, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.376810908317566, "train/total_loss": 0.8503942489624023 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.20954521000385284, "train/contrastive_loss": 2.272305727005005, "train/negative_loss": 1.4754786491394043, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.7968271374702454, "train/total_loss": 0.6640063524246216 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1568308174610138, "train/contrastive_loss": 3.2329628467559814, "train/negative_loss": 0.8909221291542053, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.342040777206421, "train/total_loss": 0.8034234046936035 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.18643267452716827, "train/contrastive_loss": 1.139142632484436, "train/negative_loss": 0.6296855211257935, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5094571113586426, "train/total_loss": 0.41426122188568115 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.15659183263778687, "train/contrastive_loss": 1.1242566108703613, "train/negative_loss": 0.5465371608734131, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.577719509601593, "train/total_loss": 0.3814431428909302 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21117204427719116, "train/contrastive_loss": 1.4498136043548584, "train/negative_loss": 0.9634303450584412, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.4863832890987396, "train/total_loss": 0.5011347532272339 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1872931718826294, "train/contrastive_loss": 0.803306519985199, "train/negative_loss": 0.5756934881210327, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.22761301696300507, "train/total_loss": 0.34795448184013367 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19166812300682068, "train/contrastive_loss": 3.7552285194396973, "train/negative_loss": 1.8110504150390625, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.9441779851913452, "train/total_loss": 0.9427138566970825 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1606128066778183, "train/contrastive_loss": 1.4483282566070557, "train/negative_loss": 1.387937307357788, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.06039094552397728, "train/total_loss": 0.45027846097946167 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.13656173646450043, "train/contrastive_loss": 2.849153518676758, "train/negative_loss": 2.0549163818359375, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7942370176315308, "train/total_loss": 0.7063924670219421 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1886182427406311, "train/contrastive_loss": 3.554659366607666, "train/negative_loss": 1.2033625841140747, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 2.3512966632843018, "train/total_loss": 0.8995501399040222 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2407016158103943, "train/contrastive_loss": 2.665372133255005, "train/negative_loss": 1.462630033493042, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.202742099761963, "train/total_loss": 0.7737760543823242 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1961059272289276, "train/contrastive_loss": 2.311809539794922, "train/negative_loss": 1.3634473085403442, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.9483621716499329, "train/total_loss": 0.6584678292274475 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.20183724164962769, "train/contrastive_loss": 2.424044609069824, "train/negative_loss": 1.7180655002593994, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.70597904920578, "train/total_loss": 0.6866461634635925 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21263127028942108, "train/contrastive_loss": 2.2292354106903076, "train/negative_loss": 2.2167515754699707, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.012483775615692139, "train/total_loss": 0.6584783792495728 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19967931509017944, "train/contrastive_loss": 0.4156442880630493, "train/negative_loss": 0.4051029086112976, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.010541382245719433, "train/total_loss": 0.28280818462371826 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.24373365938663483, "train/contrastive_loss": 3.2246389389038086, "train/negative_loss": 1.6302928924560547, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.594346046447754, "train/total_loss": 0.8886614441871643 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.22044453024864197, "train/contrastive_loss": 1.211272120475769, "train/negative_loss": 1.0419281721115112, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.1693439483642578, "train/total_loss": 0.46269893646240234 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1694960594177246, "train/contrastive_loss": 0.7772913575172424, "train/negative_loss": 0.6609813570976257, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.1163100153207779, "train/total_loss": 0.3249543309211731 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19062626361846924, "train/contrastive_loss": 3.0883870124816895, "train/negative_loss": 1.5537185668945312, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.5346685647964478, "train/total_loss": 0.8083036541938782 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.20361821353435516, "train/contrastive_loss": 1.8659075498580933, "train/negative_loss": 1.1411710977554321, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7247364521026611, "train/total_loss": 0.576799750328064 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21600548923015594, "train/contrastive_loss": 1.862668752670288, "train/negative_loss": 1.6935091018676758, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.16915962100028992, "train/total_loss": 0.5885392427444458 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.24313080310821533, "train/contrastive_loss": 2.2547178268432617, "train/negative_loss": 1.174124002456665, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.0805939435958862, "train/total_loss": 0.6940743923187256 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.14961303770542145, "train/contrastive_loss": 2.239539861679077, "train/negative_loss": 2.2394859790802, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 5.387864075601101e-05, "train/total_loss": 0.5975210070610046 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19872525334358215, "train/contrastive_loss": 0.8004911541938782, "train/negative_loss": 0.7016170620918274, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.09887408465147018, "train/total_loss": 0.3588234782218933 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2644781768321991, "train/contrastive_loss": 2.931800365447998, "train/negative_loss": 2.60398268699646, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3278176784515381, "train/total_loss": 0.850838303565979 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.20335166156291962, "train/contrastive_loss": 0.6078771352767944, "train/negative_loss": 0.4523654878139496, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.15551163256168365, "train/total_loss": 0.32492709159851074 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2844522297382355, "train/contrastive_loss": 4.9069600105285645, "train/negative_loss": 2.1426827907562256, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.764277219772339, "train/total_loss": 1.2658442258834839 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1465490609407425, "train/contrastive_loss": 0.670142412185669, "train/negative_loss": 0.4068988859653473, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.26324349641799927, "train/total_loss": 0.28057754039764404 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1882716566324234, "train/contrastive_loss": 2.1887221336364746, "train/negative_loss": 0.973315417766571, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.2154067754745483, "train/total_loss": 0.6260160803794861 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2017248421907425, "train/contrastive_loss": 1.0781397819519043, "train/negative_loss": 1.0779799222946167, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00015984913625288755, "train/total_loss": 0.4173527956008911 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.264041006565094, "train/contrastive_loss": 1.027521014213562, "train/negative_loss": 0.9978155493736267, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.029705418273806572, "train/total_loss": 0.4695452153682709 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19865308701992035, "train/contrastive_loss": 1.1342270374298096, "train/negative_loss": 0.6809921264648438, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.4532349109649658, "train/total_loss": 0.42549848556518555 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.3010791838169098, "train/contrastive_loss": 2.9710891246795654, "train/negative_loss": 2.2176454067230225, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.753443717956543, "train/total_loss": 0.8952970504760742 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.17824791371822357, "train/contrastive_loss": 1.940492868423462, "train/negative_loss": 1.0547819137573242, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8857110142707825, "train/total_loss": 0.5663464665412903 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21051530539989471, "train/contrastive_loss": 2.504512071609497, "train/negative_loss": 2.1072912216186523, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.39722082018852234, "train/total_loss": 0.7114177346229553 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2624529302120209, "train/contrastive_loss": 2.2317891120910645, "train/negative_loss": 2.2316646575927734, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.00012446223990991712, "train/total_loss": 0.7088107466697693 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19717855751514435, "train/contrastive_loss": 1.9128272533416748, "train/negative_loss": 1.188171625137329, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.7246555685997009, "train/total_loss": 0.5797440409660339 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1748032420873642, "train/contrastive_loss": 0.8358477354049683, "train/negative_loss": 0.5673885941505432, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.26845914125442505, "train/total_loss": 0.34197279810905457 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.22560089826583862, "train/contrastive_loss": 0.820905864238739, "train/negative_loss": 0.6663085222244263, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.15459734201431274, "train/total_loss": 0.3897820711135864 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21513667702674866, "train/contrastive_loss": 0.9757977724075317, "train/negative_loss": 0.7348029613494873, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.24099482595920563, "train/total_loss": 0.410296231508255 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.30533134937286377, "train/contrastive_loss": 2.474186897277832, "train/negative_loss": 1.445794701576233, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.0283920764923096, "train/total_loss": 0.8001687526702881 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1487395316362381, "train/contrastive_loss": 0.9981712102890015, "train/negative_loss": 0.6140452027320862, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.38412603735923767, "train/total_loss": 0.34837377071380615 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1429874449968338, "train/contrastive_loss": 0.6080282330513, "train/negative_loss": 0.30353280901908875, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.3044954240322113, "train/total_loss": 0.26459309458732605 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.17727260291576385, "train/contrastive_loss": 1.2232487201690674, "train/negative_loss": 1.0168335437774658, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.20641522109508514, "train/total_loss": 0.42192235589027405 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21506135165691376, "train/contrastive_loss": 2.62617564201355, "train/negative_loss": 1.3170585632324219, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.309117078781128, "train/total_loss": 0.740296483039856 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.22454994916915894, "train/contrastive_loss": 1.4407482147216797, "train/negative_loss": 1.1716587543487549, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.2690894603729248, "train/total_loss": 0.5126996040344238 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.1419769525527954, "train/contrastive_loss": 0.2084272801876068, "train/negative_loss": 0.143569216132164, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.06485805660486221, "train/total_loss": 0.18366241455078125 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.20207370817661285, "train/contrastive_loss": 3.027205467224121, "train/negative_loss": 1.172908902168274, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.8542965650558472, "train/total_loss": 0.8075147867202759 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2549789845943451, "train/contrastive_loss": 1.9599878787994385, "train/negative_loss": 1.1245739459991455, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.8354139924049377, "train/total_loss": 0.6469765901565552 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.15109749138355255, "train/contrastive_loss": 2.3361682891845703, "train/negative_loss": 1.2406820058822632, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.0954861640930176, "train/total_loss": 0.6183311343193054 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.21592342853546143, "train/contrastive_loss": 0.8044255375862122, "train/negative_loss": 0.6018489003181458, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.2025766223669052, "train/total_loss": 0.3768085241317749 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.20050044357776642, "train/contrastive_loss": 1.799804925918579, "train/negative_loss": 0.44646501541137695, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.3533399105072021, "train/total_loss": 0.5604614615440369 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19952112436294556, "train/contrastive_loss": 3.3044862747192383, "train/negative_loss": 3.3044817447662354, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 4.446522780199302e-06, "train/total_loss": 0.8604183793067932 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19301091134548187, "train/contrastive_loss": 0.9563617706298828, "train/negative_loss": 0.7286988496780396, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.22766292095184326, "train/total_loss": 0.38428327441215515 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.22885334491729736, "train/contrastive_loss": 2.997878074645996, "train/negative_loss": 1.434131383895874, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.5637468099594116, "train/total_loss": 0.8284289836883545 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.17190083861351013, "train/contrastive_loss": 3.1119890213012695, "train/negative_loss": 1.4986212253570557, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.6133679151535034, "train/total_loss": 0.7942986488342285 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.2603514492511749, "train/contrastive_loss": 2.2727572917938232, "train/negative_loss": 1.4112029075622559, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.8615543842315674, "train/total_loss": 0.7149028778076172 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.19999635219573975, "train/contrastive_loss": 1.228564739227295, "train/negative_loss": 0.6873701214790344, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.5411945581436157, "train/total_loss": 0.4457092881202698 }, { "epoch": 5.985915492957746, "eval_exact_match_accuracy": 0.2328042328042328, "eval_hamming_loss": 0.0718954248366013, "eval_loss": 0.5884774327278137, "eval_macro_f1": 0.2116625113728062, "eval_macro_precision": 0.3748543607342939, "eval_macro_recall": 0.16463818743176792, "eval_micro_f1": 0.4556166535742341, "eval_micro_precision": 0.8656716417910447, "eval_micro_recall": 0.3091684434968017, "eval_runtime": 2.8433, "eval_samples_per_second": 199.417, "eval_steps_per_second": 24.971, "step": 1700 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.18421414494514465, "train/contrastive_loss": 1.2526923418045044, "train/negative_loss": 1.1650878190994263, "train/num_negatives": 54, "train/num_positives": 2, "train/positive_loss": 0.08760447800159454, "train/total_loss": 0.43475261330604553 }, { "epoch": 5.985915492957746, "step": 1700, "train/classification_loss": 0.23508144915103912, "train/contrastive_loss": 2.827434539794922, "train/negative_loss": 1.0404642820358276, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 1.7869703769683838, "train/total_loss": 0.8005683422088623 }, { "epoch": 6.161971830985916, "grad_norm": 14.457427978515625, "learning_rate": 1.9768005637773083e-05, "loss": 0.7991, "step": 1750 }, { "epoch": 6.161971830985916, "step": 1750, "train/classification_loss": 0.20019212365150452, "train/contrastive_loss": 0.8180999159812927, "train/negative_loss": 0.8180310130119324, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 6.890534132253379e-05, "train/total_loss": 0.36381208896636963 }, { "epoch": 6.161971830985916, "step": 1750, "train/classification_loss": 0.17518675327301025, "train/contrastive_loss": 0.8647081851959229, "train/negative_loss": 0.5790228843688965, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.28568530082702637, "train/total_loss": 0.34812837839126587 }, { "epoch": 6.338028169014084, "grad_norm": 8.555068016052246, "learning_rate": 1.976095842142354e-05, "loss": 0.8147, "step": 1800 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.23618440330028534, "train/contrastive_loss": 2.4996490478515625, "train/negative_loss": 0.9613112211227417, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.5383377075195312, "train/total_loss": 0.7361142039299011 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2643356919288635, "train/contrastive_loss": 1.064527988433838, "train/negative_loss": 0.4917549788951874, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5727729797363281, "train/total_loss": 0.47724127769470215 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2525252103805542, "train/contrastive_loss": 2.6638693809509277, "train/negative_loss": 1.0702341794967651, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.593635082244873, "train/total_loss": 0.7852991223335266 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.13786518573760986, "train/contrastive_loss": 0.6768171787261963, "train/negative_loss": 0.5316019654273987, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.14521524310112, "train/total_loss": 0.27322864532470703 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20317767560482025, "train/contrastive_loss": 2.362442970275879, "train/negative_loss": 2.241147518157959, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.1212954893708229, "train/total_loss": 0.6756662726402283 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20733687281608582, "train/contrastive_loss": 2.196223020553589, "train/negative_loss": 1.3789563179016113, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8172667026519775, "train/total_loss": 0.6465814709663391 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1985493302345276, "train/contrastive_loss": 1.9548351764678955, "train/negative_loss": 0.8695181012153625, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.0853171348571777, "train/total_loss": 0.5895164012908936 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20806984603405, "train/contrastive_loss": 1.0504621267318726, "train/negative_loss": 1.049856424331665, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0006056473357602954, "train/total_loss": 0.4181622862815857 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.13133777678012848, "train/contrastive_loss": 0.6291182637214661, "train/negative_loss": 0.45217472314834595, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.17694354057312012, "train/total_loss": 0.2571614384651184 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20885518193244934, "train/contrastive_loss": 1.6074930429458618, "train/negative_loss": 1.3285659551620483, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.27892711758613586, "train/total_loss": 0.5303537845611572 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.16874989867210388, "train/contrastive_loss": 1.2389817237854004, "train/negative_loss": 0.8842199444770813, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.3547617197036743, "train/total_loss": 0.4165462255477905 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.18696634471416473, "train/contrastive_loss": 1.7192937135696411, "train/negative_loss": 1.7190954685211182, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0001982092799153179, "train/total_loss": 0.5308250784873962 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2098003774881363, "train/contrastive_loss": 3.7497010231018066, "train/negative_loss": 2.165863037109375, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.5838379859924316, "train/total_loss": 0.9597405791282654 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1998313069343567, "train/contrastive_loss": 1.3455989360809326, "train/negative_loss": 0.9798943996429443, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.3657044768333435, "train/total_loss": 0.46895110607147217 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.14849337935447693, "train/contrastive_loss": 2.0187861919403076, "train/negative_loss": 0.6614004969596863, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.3573856353759766, "train/total_loss": 0.5522506237030029 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.18422512710094452, "train/contrastive_loss": 1.5316643714904785, "train/negative_loss": 0.697216808795929, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8344475626945496, "train/total_loss": 0.49055802822113037 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.14369253814220428, "train/contrastive_loss": 1.3306763172149658, "train/negative_loss": 0.7949985265731812, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5356777310371399, "train/total_loss": 0.4098278284072876 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20878709852695465, "train/contrastive_loss": 1.59965980052948, "train/negative_loss": 1.4177470207214355, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.18191276490688324, "train/total_loss": 0.5287190675735474 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1755540668964386, "train/contrastive_loss": 0.5103244781494141, "train/negative_loss": 0.47977203130722046, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.030552471056580544, "train/total_loss": 0.27761897444725037 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.19091834127902985, "train/contrastive_loss": 3.2964799404144287, "train/negative_loss": 1.5835227966308594, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.7129571437835693, "train/total_loss": 0.8502143025398254 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.15718308091163635, "train/contrastive_loss": 1.6903914213180542, "train/negative_loss": 1.6703453063964844, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.020046083256602287, "train/total_loss": 0.49526137113571167 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.13766010105609894, "train/contrastive_loss": 2.6639468669891357, "train/negative_loss": 1.8816156387329102, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7823312282562256, "train/total_loss": 0.6704494953155518 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1847010850906372, "train/contrastive_loss": 2.585862636566162, "train/negative_loss": 1.293681263923645, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.2921814918518066, "train/total_loss": 0.7018736004829407 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.24528996646404266, "train/contrastive_loss": 3.4418249130249023, "train/negative_loss": 1.574407696723938, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.8674172163009644, "train/total_loss": 0.9336549639701843 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.18155448138713837, "train/contrastive_loss": 2.0227980613708496, "train/negative_loss": 0.8087050914764404, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.2140930891036987, "train/total_loss": 0.5861141085624695 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2012697458267212, "train/contrastive_loss": 2.402578592300415, "train/negative_loss": 1.9920814037322998, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.41049715876579285, "train/total_loss": 0.6817854642868042 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20460467040538788, "train/contrastive_loss": 1.5915348529815674, "train/negative_loss": 1.58004891872406, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.011485951952636242, "train/total_loss": 0.5229116678237915 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1931326985359192, "train/contrastive_loss": 0.20014992356300354, "train/negative_loss": 0.18774820864200592, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.012401716783642769, "train/total_loss": 0.23316268622875214 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2523374557495117, "train/contrastive_loss": 3.8048558235168457, "train/negative_loss": 1.7720197439193726, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.0328359603881836, "train/total_loss": 1.0133086442947388 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2193804532289505, "train/contrastive_loss": 0.9227731823921204, "train/negative_loss": 0.9027462005615234, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.020026957616209984, "train/total_loss": 0.4039350748062134 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.16964419186115265, "train/contrastive_loss": 1.3177131414413452, "train/negative_loss": 1.3112902641296387, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.006422827020287514, "train/total_loss": 0.4331868290901184 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1795284003019333, "train/contrastive_loss": 1.8620396852493286, "train/negative_loss": 1.4069775342941284, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.4550621509552002, "train/total_loss": 0.5519363284111023 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.19057753682136536, "train/contrastive_loss": 1.9349257946014404, "train/negative_loss": 1.1791791915893555, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7557465434074402, "train/total_loss": 0.577562689781189 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21294724941253662, "train/contrastive_loss": 2.0243303775787354, "train/negative_loss": 1.519113302230835, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.5052170157432556, "train/total_loss": 0.6178133487701416 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.24014151096343994, "train/contrastive_loss": 2.0354576110839844, "train/negative_loss": 0.8759483098983765, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.1595091819763184, "train/total_loss": 0.6472330093383789 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.15081846714019775, "train/contrastive_loss": 1.7187182903289795, "train/negative_loss": 1.7186675071716309, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 5.083685027784668e-05, "train/total_loss": 0.4945621192455292 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21892698109149933, "train/contrastive_loss": 0.8051426410675049, "train/negative_loss": 0.39136651158332825, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.413776159286499, "train/total_loss": 0.379955530166626 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2578733563423157, "train/contrastive_loss": 2.6372523307800293, "train/negative_loss": 2.32843017578125, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.30882227420806885, "train/total_loss": 0.7853238582611084 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21549485623836517, "train/contrastive_loss": 0.7917541265487671, "train/negative_loss": 0.43763402104377747, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.35412007570266724, "train/total_loss": 0.3738456964492798 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.282681405544281, "train/contrastive_loss": 3.414781093597412, "train/negative_loss": 2.166337251663208, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.2484439611434937, "train/total_loss": 0.9656376242637634 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.14941991865634918, "train/contrastive_loss": 0.9621403217315674, "train/negative_loss": 0.629996657371521, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.332143634557724, "train/total_loss": 0.3418479859828949 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.17254632711410522, "train/contrastive_loss": 2.058793544769287, "train/negative_loss": 1.2110460996627808, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.8477475643157959, "train/total_loss": 0.5843050479888916 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1880212128162384, "train/contrastive_loss": 0.8820734024047852, "train/negative_loss": 0.8819945454597473, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 7.886016828706488e-05, "train/total_loss": 0.36443591117858887 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.2603602111339569, "train/contrastive_loss": 1.15123450756073, "train/negative_loss": 1.1470509767532349, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.004183569457381964, "train/total_loss": 0.4906071126461029 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1882232129573822, "train/contrastive_loss": 0.6139564514160156, "train/negative_loss": 0.6025113463401794, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.011445131152868271, "train/total_loss": 0.3110145032405853 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.3184067904949188, "train/contrastive_loss": 3.5926332473754883, "train/negative_loss": 2.827404022216797, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.7652291059494019, "train/total_loss": 1.036933422088623 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.17019306123256683, "train/contrastive_loss": 1.4210273027420044, "train/negative_loss": 1.062803864479065, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.35822346806526184, "train/total_loss": 0.454398512840271 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21009114384651184, "train/contrastive_loss": 2.857487916946411, "train/negative_loss": 2.3472461700439453, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5102417469024658, "train/total_loss": 0.7815887928009033 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.25049540400505066, "train/contrastive_loss": 2.4972052574157715, "train/negative_loss": 2.497196912765503, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 8.225474630307872e-06, "train/total_loss": 0.7499364614486694 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20436859130859375, "train/contrastive_loss": 1.9877409934997559, "train/negative_loss": 0.980452835559845, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.0072880983352661, "train/total_loss": 0.6019167900085449 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.15812022984027863, "train/contrastive_loss": 0.2669823169708252, "train/negative_loss": 0.19041016697883606, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.07657214254140854, "train/total_loss": 0.21151669323444366 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21329163014888763, "train/contrastive_loss": 0.8076227307319641, "train/negative_loss": 0.6478399634361267, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.1597827672958374, "train/total_loss": 0.3748161792755127 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21620073914527893, "train/contrastive_loss": 0.8952352404594421, "train/negative_loss": 0.8577362895011902, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.03749896213412285, "train/total_loss": 0.39524778723716736 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.30255407094955444, "train/contrastive_loss": 2.703613758087158, "train/negative_loss": 1.199798822402954, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.5038150548934937, "train/total_loss": 0.843276858329773 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.14780624210834503, "train/contrastive_loss": 1.1930758953094482, "train/negative_loss": 0.36876219511032104, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.824313759803772, "train/total_loss": 0.38642144203186035 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.14649800956249237, "train/contrastive_loss": 1.084219217300415, "train/negative_loss": 0.3242172300815582, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.7600019574165344, "train/total_loss": 0.3633418679237366 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1859196573495865, "train/contrastive_loss": 2.993258237838745, "train/negative_loss": 0.9514286518096924, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.0418295860290527, "train/total_loss": 0.7845712900161743 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20863163471221924, "train/contrastive_loss": 2.637061834335327, "train/negative_loss": 1.389975666999817, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.2470861673355103, "train/total_loss": 0.7360439896583557 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21374037861824036, "train/contrastive_loss": 1.1649141311645508, "train/negative_loss": 0.9411524534225464, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.22376161813735962, "train/total_loss": 0.44672322273254395 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.13585400581359863, "train/contrastive_loss": 0.2632651627063751, "train/negative_loss": 0.24225668609142303, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.021008474752306938, "train/total_loss": 0.18850703537464142 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.19233687222003937, "train/contrastive_loss": 2.8636417388916016, "train/negative_loss": 1.3234347105026245, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.5402069091796875, "train/total_loss": 0.7650651931762695 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.26650911569595337, "train/contrastive_loss": 1.9120588302612305, "train/negative_loss": 1.7381545305252075, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.17390435934066772, "train/total_loss": 0.6489208936691284 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1460341066122055, "train/contrastive_loss": 1.1903585195541382, "train/negative_loss": 0.9340766668319702, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2562818229198456, "train/total_loss": 0.3841058015823364 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.19368679821491241, "train/contrastive_loss": 0.8795298337936401, "train/negative_loss": 0.7353776693344116, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.14415216445922852, "train/total_loss": 0.3695927858352661 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.19111137092113495, "train/contrastive_loss": 1.9831018447875977, "train/negative_loss": 0.8209530711174011, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.1621488332748413, "train/total_loss": 0.5877317190170288 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.20079556107521057, "train/contrastive_loss": 5.566178321838379, "train/negative_loss": 5.566175937652588, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.3841892016207566e-06, "train/total_loss": 1.3140312433242798 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.190120667219162, "train/contrastive_loss": 0.8163983821868896, "train/negative_loss": 0.39662086963653564, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.4197775423526764, "train/total_loss": 0.3534003496170044 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.21868683397769928, "train/contrastive_loss": 2.932465076446533, "train/negative_loss": 1.7568747997283936, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1755903959274292, "train/total_loss": 0.8051798343658447 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1656399667263031, "train/contrastive_loss": 1.8630726337432861, "train/negative_loss": 0.8169066905975342, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.046165943145752, "train/total_loss": 0.5382544994354248 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.25913915038108826, "train/contrastive_loss": 1.9436025619506836, "train/negative_loss": 1.7970094680786133, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.14659306406974792, "train/total_loss": 0.6478596925735474 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.19009657204151154, "train/contrastive_loss": 1.6608723402023315, "train/negative_loss": 1.394348382949829, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.26652395725250244, "train/total_loss": 0.5222710371017456 }, { "epoch": 6.338028169014084, "eval_exact_match_accuracy": 0.24691358024691357, "eval_hamming_loss": 0.0718954248366013, "eval_loss": 0.5680800080299377, "eval_macro_f1": 0.2427411732331366, "eval_macro_precision": 0.47275031413037283, "eval_macro_recall": 0.19414416262327208, "eval_micro_f1": 0.4746019711902957, "eval_micro_precision": 0.821522309711286, "eval_micro_recall": 0.3336886993603412, "eval_runtime": 2.8484, "eval_samples_per_second": 199.062, "eval_steps_per_second": 24.927, "step": 1800 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.1515735685825348, "train/contrastive_loss": 0.8138993382453918, "train/negative_loss": 0.6973198056221008, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.11657953262329102, "train/total_loss": 0.31435343623161316 }, { "epoch": 6.338028169014084, "step": 1800, "train/classification_loss": 0.18316659331321716, "train/contrastive_loss": 1.312180757522583, "train/negative_loss": 0.9477595686912537, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.3644212484359741, "train/total_loss": 0.44560274481773376 }, { "epoch": 6.514084507042254, "grad_norm": 30.647846221923828, "learning_rate": 1.9753911205073996e-05, "loss": 0.7836, "step": 1850 }, { "epoch": 6.514084507042254, "step": 1850, "train/classification_loss": 0.13582298159599304, "train/contrastive_loss": 0.8106577396392822, "train/negative_loss": 0.49388763308525085, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.31677013635635376, "train/total_loss": 0.2979545295238495 }, { "epoch": 6.514084507042254, "step": 1850, "train/classification_loss": 0.21405598521232605, "train/contrastive_loss": 1.100415587425232, "train/negative_loss": 0.6814552545547485, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.4189603328704834, "train/total_loss": 0.43413910269737244 }, { "epoch": 6.690140845070422, "grad_norm": 12.289376258850098, "learning_rate": 1.9746863988724457e-05, "loss": 0.8155, "step": 1900 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.23372109234333038, "train/contrastive_loss": 3.2158899307250977, "train/negative_loss": 1.3862863779067993, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.829603672027588, "train/total_loss": 0.8768990635871887 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.27038395404815674, "train/contrastive_loss": 0.7699598073959351, "train/negative_loss": 0.599881649017334, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.17007815837860107, "train/total_loss": 0.4243759214878082 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.23821960389614105, "train/contrastive_loss": 2.791719913482666, "train/negative_loss": 1.4407185316085815, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.351001262664795, "train/total_loss": 0.7965636253356934 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.14065875113010406, "train/contrastive_loss": 1.65958571434021, "train/negative_loss": 0.9428386092185974, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7167471051216125, "train/total_loss": 0.4725759029388428 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.22161826491355896, "train/contrastive_loss": 3.0368266105651855, "train/negative_loss": 2.989464521408081, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.04736214876174927, "train/total_loss": 0.8289835453033447 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2155858427286148, "train/contrastive_loss": 2.4562065601348877, "train/negative_loss": 2.086688756942749, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.3695177435874939, "train/total_loss": 0.7068271636962891 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19224867224693298, "train/contrastive_loss": 1.82871675491333, "train/negative_loss": 1.0345207452774048, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.7941960096359253, "train/total_loss": 0.5579920411109924 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.20780417323112488, "train/contrastive_loss": 1.473059058189392, "train/negative_loss": 1.4729293584823608, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.000129708118038252, "train/total_loss": 0.5024160146713257 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.11690351366996765, "train/contrastive_loss": 0.24079112708568573, "train/negative_loss": 0.1931220442056656, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.04766908288002014, "train/total_loss": 0.16506174206733704 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.23107852041721344, "train/contrastive_loss": 2.6729283332824707, "train/negative_loss": 1.9350939989089966, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.7378343939781189, "train/total_loss": 0.7656641602516174 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.16104593873023987, "train/contrastive_loss": 1.2811723947525024, "train/negative_loss": 0.9447054862976074, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.336466908454895, "train/total_loss": 0.4172804355621338 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1898118257522583, "train/contrastive_loss": 2.337682008743286, "train/negative_loss": 2.3365840911865234, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.001097861211746931, "train/total_loss": 0.6573482751846313 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.21859918534755707, "train/contrastive_loss": 3.874910831451416, "train/negative_loss": 2.375621795654297, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.4992889165878296, "train/total_loss": 0.9935813546180725 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19474028050899506, "train/contrastive_loss": 1.2165257930755615, "train/negative_loss": 0.9295287132263184, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.28699710965156555, "train/total_loss": 0.4380454421043396 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.13938456773757935, "train/contrastive_loss": 1.7123061418533325, "train/negative_loss": 0.773226261138916, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.9390798807144165, "train/total_loss": 0.48184579610824585 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.17868198454380035, "train/contrastive_loss": 1.6806676387786865, "train/negative_loss": 0.8136024475097656, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8670651912689209, "train/total_loss": 0.5148155093193054 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.13712361454963684, "train/contrastive_loss": 1.727832317352295, "train/negative_loss": 0.965118944644928, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7627133727073669, "train/total_loss": 0.48269009590148926 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.20445416867733002, "train/contrastive_loss": 1.7956867218017578, "train/negative_loss": 1.5415583848953247, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.2541283071041107, "train/total_loss": 0.5635915398597717 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.17574962973594666, "train/contrastive_loss": 0.7344685196876526, "train/negative_loss": 0.7213791012763977, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.013089398853480816, "train/total_loss": 0.32264333963394165 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1970960795879364, "train/contrastive_loss": 3.4482498168945312, "train/negative_loss": 1.6692242622375488, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.7790255546569824, "train/total_loss": 0.8867460489273071 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.15910790860652924, "train/contrastive_loss": 2.4080164432525635, "train/negative_loss": 2.366711139678955, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.04130534082651138, "train/total_loss": 0.6407111883163452 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1344788819551468, "train/contrastive_loss": 2.969633102416992, "train/negative_loss": 2.035134792327881, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9344983100891113, "train/total_loss": 0.7284054756164551 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.18802078068256378, "train/contrastive_loss": 3.068547487258911, "train/negative_loss": 2.0661990642547607, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.0023484230041504, "train/total_loss": 0.8017302751541138 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2385285645723343, "train/contrastive_loss": 3.411303758621216, "train/negative_loss": 1.678453803062439, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.7328499555587769, "train/total_loss": 0.9207893013954163 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.17487332224845886, "train/contrastive_loss": 1.6150904893875122, "train/negative_loss": 0.6004703044891357, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.0146201848983765, "train/total_loss": 0.4978914260864258 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2230340838432312, "train/contrastive_loss": 3.04897141456604, "train/negative_loss": 2.6776747703552246, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.37129664421081543, "train/total_loss": 0.8328284025192261 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.20771414041519165, "train/contrastive_loss": 1.9516738653182983, "train/negative_loss": 1.9042127132415771, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0474611259996891, "train/total_loss": 0.5980489253997803 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19842027127742767, "train/contrastive_loss": 0.6385742425918579, "train/negative_loss": 0.5296170711517334, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.10895716398954391, "train/total_loss": 0.32613512873649597 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2546830475330353, "train/contrastive_loss": 3.3375473022460938, "train/negative_loss": 1.7217724323272705, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.6157747507095337, "train/total_loss": 0.9221925735473633 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.22745093703269958, "train/contrastive_loss": 1.483272910118103, "train/negative_loss": 1.4721198081970215, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.011153125204145908, "train/total_loss": 0.5241055488586426 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1658446192741394, "train/contrastive_loss": 1.7293444871902466, "train/negative_loss": 1.7292804718017578, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 6.39890058664605e-05, "train/total_loss": 0.5117135047912598 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1772678792476654, "train/contrastive_loss": 2.528303861618042, "train/negative_loss": 1.8653534650802612, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.662950336933136, "train/total_loss": 0.6829286813735962 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19365540146827698, "train/contrastive_loss": 1.9069876670837402, "train/negative_loss": 1.4431899785995483, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.4637976586818695, "train/total_loss": 0.5750529766082764 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.21822020411491394, "train/contrastive_loss": 2.259861469268799, "train/negative_loss": 1.7424304485321045, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.5174309611320496, "train/total_loss": 0.6701924800872803 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2339928299188614, "train/contrastive_loss": 1.7953006029129028, "train/negative_loss": 1.2796703577041626, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5156302452087402, "train/total_loss": 0.5930529832839966 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.14385662972927094, "train/contrastive_loss": 1.7576894760131836, "train/negative_loss": 1.757625937461853, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 6.35528631391935e-05, "train/total_loss": 0.4953945279121399 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.21224145591259003, "train/contrastive_loss": 0.9677494168281555, "train/negative_loss": 0.7769870162010193, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.19076238572597504, "train/total_loss": 0.40579134225845337 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.26073524355888367, "train/contrastive_loss": 2.4725046157836914, "train/negative_loss": 1.906913161277771, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.56559157371521, "train/total_loss": 0.7552361488342285 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.20143432915210724, "train/contrastive_loss": 0.35213300585746765, "train/negative_loss": 0.32196640968322754, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.030166584998369217, "train/total_loss": 0.27186092734336853 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2922963500022888, "train/contrastive_loss": 3.730564832687378, "train/negative_loss": 2.024803876876831, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.7057609558105469, "train/total_loss": 1.0384093523025513 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.14334173500537872, "train/contrastive_loss": 1.0197844505310059, "train/negative_loss": 0.7755264639854431, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.24425797164440155, "train/total_loss": 0.34729862213134766 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.16851532459259033, "train/contrastive_loss": 1.9482519626617432, "train/negative_loss": 1.5255510807037354, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4227008521556854, "train/total_loss": 0.5581657290458679 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1941116750240326, "train/contrastive_loss": 1.0349037647247314, "train/negative_loss": 1.0348531007766724, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 5.060583498561755e-05, "train/total_loss": 0.40109241008758545 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.251036137342453, "train/contrastive_loss": 1.2935383319854736, "train/negative_loss": 1.2841545343399048, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.009383788332343102, "train/total_loss": 0.5097438097000122 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19396381080150604, "train/contrastive_loss": 1.0589491128921509, "train/negative_loss": 1.0146514177322388, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.044297702610492706, "train/total_loss": 0.40575364232063293 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.3197799026966095, "train/contrastive_loss": 2.846153736114502, "train/negative_loss": 1.9570695161819458, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.8890842795372009, "train/total_loss": 0.8890106678009033 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.17094211280345917, "train/contrastive_loss": 1.5236997604370117, "train/negative_loss": 1.1987823247909546, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.32491737604141235, "train/total_loss": 0.4756820797920227 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19952167570590973, "train/contrastive_loss": 2.54634952545166, "train/negative_loss": 2.0986878871917725, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.44766175746917725, "train/total_loss": 0.7087915539741516 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2637220621109009, "train/contrastive_loss": 3.4194865226745605, "train/negative_loss": 3.419389247894287, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 9.716029308037832e-05, "train/total_loss": 0.9476193785667419 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.18567171692848206, "train/contrastive_loss": 1.8019644021987915, "train/negative_loss": 0.8965386748313904, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.9054257273674011, "train/total_loss": 0.5460646152496338 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.14846765995025635, "train/contrastive_loss": 0.3383611738681793, "train/negative_loss": 0.2893919348716736, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.04896923899650574, "train/total_loss": 0.21613989770412445 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2143513411283493, "train/contrastive_loss": 0.8977898359298706, "train/negative_loss": 0.7769964337348938, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.1207934021949768, "train/total_loss": 0.3939093053340912 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.20978379249572754, "train/contrastive_loss": 0.9033424854278564, "train/negative_loss": 0.879086971282959, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.024255530908703804, "train/total_loss": 0.3904522955417633 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2949010133743286, "train/contrastive_loss": 2.775782585144043, "train/negative_loss": 1.5411112308502197, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.2346712350845337, "train/total_loss": 0.8500575423240662 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1392522156238556, "train/contrastive_loss": 0.5150004625320435, "train/negative_loss": 0.3977017104625702, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.11729878187179565, "train/total_loss": 0.24225232005119324 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1353110373020172, "train/contrastive_loss": 0.6411240100860596, "train/negative_loss": 0.3942115008831024, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.24691250920295715, "train/total_loss": 0.26353585720062256 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.16366037726402283, "train/contrastive_loss": 0.9654884338378906, "train/negative_loss": 0.8125596046447754, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.15292885899543762, "train/total_loss": 0.3567580580711365 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.21263548731803894, "train/contrastive_loss": 3.341897964477539, "train/negative_loss": 1.6389883756637573, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.7029095888137817, "train/total_loss": 0.8810150623321533 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.20965367555618286, "train/contrastive_loss": 1.287813425064087, "train/negative_loss": 0.9864407777786255, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.3013727068901062, "train/total_loss": 0.4672163724899292 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.12619730830192566, "train/contrastive_loss": 0.20683008432388306, "train/negative_loss": 0.18669262528419495, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.020137455314397812, "train/total_loss": 0.1675633192062378 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1951521784067154, "train/contrastive_loss": 2.7269630432128906, "train/negative_loss": 1.184470772743225, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.5424922704696655, "train/total_loss": 0.7405447959899902 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.27544525265693665, "train/contrastive_loss": 2.3511710166931152, "train/negative_loss": 1.8781392574310303, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.47303175926208496, "train/total_loss": 0.745679497718811 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.13615156710147858, "train/contrastive_loss": 2.0564262866973877, "train/negative_loss": 1.1554896831512451, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.9009365439414978, "train/total_loss": 0.5474368333816528 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19944772124290466, "train/contrastive_loss": 1.4613717794418335, "train/negative_loss": 0.9308468103408813, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.5305249691009521, "train/total_loss": 0.49172207713127136 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19426573812961578, "train/contrastive_loss": 0.9899672269821167, "train/negative_loss": 0.6158229112625122, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.3741443455219269, "train/total_loss": 0.3922591805458069 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.19476650655269623, "train/contrastive_loss": 4.197413921356201, "train/negative_loss": 4.197410583496094, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 3.564370445019449e-06, "train/total_loss": 1.0342493057250977 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.18569374084472656, "train/contrastive_loss": 0.9398561716079712, "train/negative_loss": 0.44885239005088806, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.4910038113594055, "train/total_loss": 0.3736649751663208 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.21243086457252502, "train/contrastive_loss": 1.806515097618103, "train/negative_loss": 1.6013031005859375, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.20521198213100433, "train/total_loss": 0.573733925819397 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1697894185781479, "train/contrastive_loss": 2.1891608238220215, "train/negative_loss": 1.155372142791748, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.0337885618209839, "train/total_loss": 0.6076216101646423 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.26295313239097595, "train/contrastive_loss": 2.4246573448181152, "train/negative_loss": 2.173088312149048, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.25156909227371216, "train/total_loss": 0.7478846311569214 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.2108353227376938, "train/contrastive_loss": 2.371546506881714, "train/negative_loss": 1.8840951919555664, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.48745131492614746, "train/total_loss": 0.6851446032524109 }, { "epoch": 6.690140845070422, "eval_exact_match_accuracy": 0.23985890652557318, "eval_hamming_loss": 0.07199917003838573, "eval_loss": 0.5858319997787476, "eval_macro_f1": 0.23369980164035162, "eval_macro_precision": 0.3577172514594292, "eval_macro_recall": 0.18727694783923346, "eval_micro_f1": 0.4766214177978884, "eval_micro_precision": 0.8144329896907216, "eval_micro_recall": 0.3368869936034115, "eval_runtime": 2.8614, "eval_samples_per_second": 198.153, "eval_steps_per_second": 24.813, "step": 1900 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1914425790309906, "train/contrastive_loss": 0.9861552715301514, "train/negative_loss": 0.7161850333213806, "train/num_negatives": 34, "train/num_positives": 8, "train/positive_loss": 0.26997020840644836, "train/total_loss": 0.3886736333370209 }, { "epoch": 6.690140845070422, "step": 1900, "train/classification_loss": 0.1036413162946701, "train/contrastive_loss": 0.8758577108383179, "train/negative_loss": 0.7414747476577759, "train/num_negatives": 14, "train/num_positives": 42, "train/positive_loss": 0.13438299298286438, "train/total_loss": 0.27881285548210144 }, { "epoch": 6.866197183098592, "grad_norm": 12.582423210144043, "learning_rate": 1.9739816772374912e-05, "loss": 0.8348, "step": 1950 }, { "epoch": 6.866197183098592, "step": 1950, "train/classification_loss": 0.16489115357398987, "train/contrastive_loss": 1.159151315689087, "train/negative_loss": 0.5638828277587891, "train/num_negatives": 44, "train/num_positives": 10, "train/positive_loss": 0.5952684283256531, "train/total_loss": 0.39672142267227173 }, { "epoch": 6.866197183098592, "step": 1950, "train/classification_loss": 0.1773223578929901, "train/contrastive_loss": 1.3071624040603638, "train/negative_loss": 0.7744905352592468, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.5326718688011169, "train/total_loss": 0.4387548565864563 }, { "epoch": 7.042253521126761, "grad_norm": 20.763103485107422, "learning_rate": 1.973276955602537e-05, "loss": 0.812, "step": 2000 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2362351417541504, "train/contrastive_loss": 1.8519260883331299, "train/negative_loss": 1.4278429746627808, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.42408308386802673, "train/total_loss": 0.6066203713417053 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.24857378005981445, "train/contrastive_loss": 1.9192769527435303, "train/negative_loss": 0.5345038771629333, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.3847731351852417, "train/total_loss": 0.6324291825294495 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2557935118675232, "train/contrastive_loss": 2.0504822731018066, "train/negative_loss": 1.2515318393707275, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.7989503741264343, "train/total_loss": 0.6658899784088135 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.13967962563037872, "train/contrastive_loss": 1.2220646142959595, "train/negative_loss": 0.49229907989501953, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7297655344009399, "train/total_loss": 0.3840925693511963 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.21881839632987976, "train/contrastive_loss": 2.4377989768981934, "train/negative_loss": 2.1648924350738525, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.272906631231308, "train/total_loss": 0.7063782215118408 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.20519232749938965, "train/contrastive_loss": 2.113013744354248, "train/negative_loss": 1.5762704610824585, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.5367433428764343, "train/total_loss": 0.6277951002120972 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2447187751531601, "train/contrastive_loss": 2.3133597373962402, "train/negative_loss": 1.4129846096038818, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9003751277923584, "train/total_loss": 0.7073907256126404 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.20461270213127136, "train/contrastive_loss": 1.3597595691680908, "train/negative_loss": 1.3584171533584595, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0013423627242445946, "train/total_loss": 0.4765646159648895 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.11606776714324951, "train/contrastive_loss": 0.7776416540145874, "train/negative_loss": 0.17869257926940918, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.5989490747451782, "train/total_loss": 0.27159610390663147 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.20091688632965088, "train/contrastive_loss": 1.4774000644683838, "train/negative_loss": 0.8960364460945129, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5813636183738708, "train/total_loss": 0.49639689922332764 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1626138538122177, "train/contrastive_loss": 2.7368881702423096, "train/negative_loss": 0.7150574326515198, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 2.0218307971954346, "train/total_loss": 0.7099915146827698 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18105195462703705, "train/contrastive_loss": 1.9752154350280762, "train/negative_loss": 0.9806166887283325, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.9945988059043884, "train/total_loss": 0.5760950446128845 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.21323104202747345, "train/contrastive_loss": 4.088104248046875, "train/negative_loss": 2.310882091522217, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.7772222757339478, "train/total_loss": 1.03085196018219 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.20089012384414673, "train/contrastive_loss": 0.9459574222564697, "train/negative_loss": 0.9221904873847961, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.023766906931996346, "train/total_loss": 0.39008161425590515 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1529805064201355, "train/contrastive_loss": 2.7501914501190186, "train/negative_loss": 0.7597729563713074, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.9904184341430664, "train/total_loss": 0.7030187845230103 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1842104196548462, "train/contrastive_loss": 1.3468527793884277, "train/negative_loss": 0.7031615376472473, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.6436912417411804, "train/total_loss": 0.45358097553253174 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.15590372681617737, "train/contrastive_loss": 1.2907254695892334, "train/negative_loss": 0.5921145677566528, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6986109018325806, "train/total_loss": 0.41404882073402405 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.21427588164806366, "train/contrastive_loss": 2.122995376586914, "train/negative_loss": 1.0316722393035889, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.0913230180740356, "train/total_loss": 0.6388749480247498 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.17009508609771729, "train/contrastive_loss": 2.3069941997528076, "train/negative_loss": 0.44117772579193115, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 1.8658164739608765, "train/total_loss": 0.6314939260482788 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19829769432544708, "train/contrastive_loss": 3.1649794578552246, "train/negative_loss": 1.2711479663848877, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.893831491470337, "train/total_loss": 0.8312935829162598 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.15294112265110016, "train/contrastive_loss": 1.5679103136062622, "train/negative_loss": 1.4811872243881226, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.08672310411930084, "train/total_loss": 0.4665231704711914 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1360597163438797, "train/contrastive_loss": 2.8801255226135254, "train/negative_loss": 1.8268636465072632, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0532619953155518, "train/total_loss": 0.7120848298072815 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.17827272415161133, "train/contrastive_loss": 1.3183475732803345, "train/negative_loss": 1.082555890083313, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.23579168319702148, "train/total_loss": 0.4419422447681427 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.23059043288230896, "train/contrastive_loss": 2.581986427307129, "train/negative_loss": 1.0841857194900513, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.4978007078170776, "train/total_loss": 0.7469877004623413 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1846114695072174, "train/contrastive_loss": 2.9019343852996826, "train/negative_loss": 0.7159580588340759, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 2.185976266860962, "train/total_loss": 0.7649983167648315 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2163945436477661, "train/contrastive_loss": 2.67317795753479, "train/negative_loss": 2.2118775844573975, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.46130040287971497, "train/total_loss": 0.7510301470756531 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18990576267242432, "train/contrastive_loss": 1.328331470489502, "train/negative_loss": 1.2516578435897827, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.07667367160320282, "train/total_loss": 0.45557206869125366 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19577154517173767, "train/contrastive_loss": 0.4446567893028259, "train/negative_loss": 0.31728339195251465, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.12737338244915009, "train/total_loss": 0.2847028970718384 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2638605833053589, "train/contrastive_loss": 3.8089709281921387, "train/negative_loss": 1.8787500858306885, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.9302209615707397, "train/total_loss": 1.0256547927856445 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19399510324001312, "train/contrastive_loss": 0.2953444719314575, "train/negative_loss": 0.29346784949302673, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0018766270950436592, "train/total_loss": 0.25306400656700134 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.16145648062229156, "train/contrastive_loss": 0.8155556321144104, "train/negative_loss": 0.8145245313644409, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0010311153018847108, "train/total_loss": 0.32456761598587036 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18451470136642456, "train/contrastive_loss": 3.1608457565307617, "train/negative_loss": 1.346009612083435, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.8148361444473267, "train/total_loss": 0.8166838884353638 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19750577211380005, "train/contrastive_loss": 2.7886009216308594, "train/negative_loss": 1.5062581300735474, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.2823426723480225, "train/total_loss": 0.7552259564399719 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2239988148212433, "train/contrastive_loss": 1.6791869401931763, "train/negative_loss": 1.523707389831543, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.1554795205593109, "train/total_loss": 0.559836208820343 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.23329736292362213, "train/contrastive_loss": 1.4122387170791626, "train/negative_loss": 1.0055705308914185, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.40666818618774414, "train/total_loss": 0.5157451033592224 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1416924148797989, "train/contrastive_loss": 1.7027676105499268, "train/negative_loss": 1.6979366540908813, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.004831010941416025, "train/total_loss": 0.48224592208862305 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19002702832221985, "train/contrastive_loss": 1.052809476852417, "train/negative_loss": 0.48256024718284607, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.5702492594718933, "train/total_loss": 0.4005889296531677 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.24436832964420319, "train/contrastive_loss": 2.652658224105835, "train/negative_loss": 2.5322282314300537, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.12043005228042603, "train/total_loss": 0.774899959564209 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2173294723033905, "train/contrastive_loss": 1.050851583480835, "train/negative_loss": 0.41586580872535706, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.6349857449531555, "train/total_loss": 0.42749977111816406 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2557370960712433, "train/contrastive_loss": 3.507844924926758, "train/negative_loss": 1.7896414995193481, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.7182034254074097, "train/total_loss": 0.9573061466217041 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.15647295117378235, "train/contrastive_loss": 1.9243996143341064, "train/negative_loss": 0.8473648428916931, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.077034831047058, "train/total_loss": 0.5413528680801392 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19858531653881073, "train/contrastive_loss": 3.264824628829956, "train/negative_loss": 1.9236528873443604, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.3411717414855957, "train/total_loss": 0.851550281047821 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18637149035930634, "train/contrastive_loss": 0.8652422428131104, "train/negative_loss": 0.8648046851158142, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00043756456580013037, "train/total_loss": 0.35941994190216064 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.23737040162086487, "train/contrastive_loss": 1.315877914428711, "train/negative_loss": 1.2596700191497803, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.05620790645480156, "train/total_loss": 0.5005459785461426 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.17482119798660278, "train/contrastive_loss": 0.5855051279067993, "train/negative_loss": 0.49711862206459045, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.08838652074337006, "train/total_loss": 0.2919222116470337 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.3261856138706207, "train/contrastive_loss": 3.35722017288208, "train/negative_loss": 2.8081116676330566, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.5491083860397339, "train/total_loss": 0.9976296424865723 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1665060967206955, "train/contrastive_loss": 2.3770527839660645, "train/negative_loss": 1.1813523769378662, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.1957004070281982, "train/total_loss": 0.6419166326522827 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19585020840168, "train/contrastive_loss": 2.3128790855407715, "train/negative_loss": 1.997403860092163, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3154752850532532, "train/total_loss": 0.65842604637146 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.26863744854927063, "train/contrastive_loss": 1.9115461111068726, "train/negative_loss": 1.9073971509933472, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 0.004148912150412798, "train/total_loss": 0.6509466767311096 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.20195668935775757, "train/contrastive_loss": 2.6705875396728516, "train/negative_loss": 1.3570350408554077, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.3135526180267334, "train/total_loss": 0.7360742092132568 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.14928652346134186, "train/contrastive_loss": 0.4415435791015625, "train/negative_loss": 0.1442383974790573, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.2973051965236664, "train/total_loss": 0.23759523034095764 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.21754610538482666, "train/contrastive_loss": 0.9183329939842224, "train/negative_loss": 0.8456249237060547, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.07270805537700653, "train/total_loss": 0.4012126922607422 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2064519226551056, "train/contrastive_loss": 1.0396910905838013, "train/negative_loss": 0.7583673596382141, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.28132373094558716, "train/total_loss": 0.4143901467323303 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.3096502721309662, "train/contrastive_loss": 3.450502872467041, "train/negative_loss": 1.6730321645736694, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.777470588684082, "train/total_loss": 0.9997508525848389 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.14425420761108398, "train/contrastive_loss": 1.5759310722351074, "train/negative_loss": 0.5687820315361023, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.00714910030365, "train/total_loss": 0.4594404399394989 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.15498444437980652, "train/contrastive_loss": 0.9943720698356628, "train/negative_loss": 0.39699310064315796, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.5973789691925049, "train/total_loss": 0.3538588583469391 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1753116250038147, "train/contrastive_loss": 1.2349880933761597, "train/negative_loss": 0.8611277937889099, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.37386029958724976, "train/total_loss": 0.4223092496395111 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.20669427514076233, "train/contrastive_loss": 2.516334056854248, "train/negative_loss": 1.600029468536377, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.9163047075271606, "train/total_loss": 0.7099610567092896 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2280310094356537, "train/contrastive_loss": 1.7300918102264404, "train/negative_loss": 0.9287343621253967, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.8013574481010437, "train/total_loss": 0.5740493535995483 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1291375607252121, "train/contrastive_loss": 0.3905165195465088, "train/negative_loss": 0.36405906081199646, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.026457473635673523, "train/total_loss": 0.20724086463451385 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18336929380893707, "train/contrastive_loss": 2.472332000732422, "train/negative_loss": 0.8201510310173035, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.6521809101104736, "train/total_loss": 0.6778357028961182 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.26893728971481323, "train/contrastive_loss": 2.540144205093384, "train/negative_loss": 2.33729887008667, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.20284537971019745, "train/total_loss": 0.7769661545753479 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.15116026997566223, "train/contrastive_loss": 3.666731357574463, "train/negative_loss": 1.3440535068511963, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.3226778507232666, "train/total_loss": 0.8845065832138062 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19742503762245178, "train/contrastive_loss": 1.1862914562225342, "train/negative_loss": 0.8539636731147766, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3323277235031128, "train/total_loss": 0.43468332290649414 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19969873130321503, "train/contrastive_loss": 2.613133668899536, "train/negative_loss": 0.7444072365760803, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.868726372718811, "train/total_loss": 0.7223255038261414 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.1827583760023117, "train/contrastive_loss": 2.811319589614868, "train/negative_loss": 2.811307430267334, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.224303832714213e-05, "train/total_loss": 0.7450222969055176 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18829362094402313, "train/contrastive_loss": 1.503467082977295, "train/negative_loss": 0.5310150980949402, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.9724519848823547, "train/total_loss": 0.4889870285987854 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2116677165031433, "train/contrastive_loss": 1.8518648147583008, "train/negative_loss": 1.1245393753051758, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.727325439453125, "train/total_loss": 0.5820406675338745 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18907849490642548, "train/contrastive_loss": 3.509683132171631, "train/negative_loss": 1.1446689367294312, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.36501407623291, "train/total_loss": 0.8910151720046997 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.2407016158103943, "train/contrastive_loss": 2.019270896911621, "train/negative_loss": 1.208043098449707, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.8112277984619141, "train/total_loss": 0.6445558071136475 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.18559277057647705, "train/contrastive_loss": 0.8697998523712158, "train/negative_loss": 0.5192899703979492, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.350509911775589, "train/total_loss": 0.3595527410507202 }, { "epoch": 7.042253521126761, "eval_exact_match_accuracy": 0.24338624338624337, "eval_hamming_loss": 0.07148044402946364, "eval_loss": 0.5932103991508484, "eval_macro_f1": 0.2869839196785755, "eval_macro_precision": 0.5377193414857824, "eval_macro_recall": 0.22395556754608176, "eval_micro_f1": 0.4768413059984814, "eval_micro_precision": 0.8284960422163589, "eval_micro_recall": 0.3347547974413646, "eval_runtime": 2.8406, "eval_samples_per_second": 199.609, "eval_steps_per_second": 24.995, "step": 2000 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.19512946903705597, "train/contrastive_loss": 1.394766926765442, "train/negative_loss": 1.1764943599700928, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2182726114988327, "train/total_loss": 0.474082887172699 }, { "epoch": 7.042253521126761, "step": 2000, "train/classification_loss": 0.14290325343608856, "train/contrastive_loss": 0.8412747979164124, "train/negative_loss": 0.8009767532348633, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.040298063308000565, "train/total_loss": 0.3111582100391388 }, { "epoch": 7.21830985915493, "grad_norm": 9.392231941223145, "learning_rate": 1.972572233967583e-05, "loss": 0.7174, "step": 2050 }, { "epoch": 7.21830985915493, "step": 2050, "train/classification_loss": 0.20707447826862335, "train/contrastive_loss": 0.46742427349090576, "train/negative_loss": 0.37921902537345886, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.0882052481174469, "train/total_loss": 0.3005593419075012 }, { "epoch": 7.21830985915493, "step": 2050, "train/classification_loss": 0.16357415914535522, "train/contrastive_loss": 0.7880473732948303, "train/negative_loss": 0.43332773447036743, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.3547196388244629, "train/total_loss": 0.32118362188339233 }, { "epoch": 7.394366197183099, "grad_norm": 13.048248291015625, "learning_rate": 1.9718675123326286e-05, "loss": 0.7735, "step": 2100 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2355850785970688, "train/contrastive_loss": 1.9243850708007812, "train/negative_loss": 1.3720566034317017, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5523284673690796, "train/total_loss": 0.6204621195793152 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2805800139904022, "train/contrastive_loss": 2.2836239337921143, "train/negative_loss": 0.8140482902526855, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.4695756435394287, "train/total_loss": 0.7373048067092896 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2488636076450348, "train/contrastive_loss": 2.5649256706237793, "train/negative_loss": 1.4715982675552368, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.0933274030685425, "train/total_loss": 0.7618488073348999 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.13060618937015533, "train/contrastive_loss": 0.8548005819320679, "train/negative_loss": 0.8200228810310364, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.03477772697806358, "train/total_loss": 0.30156630277633667 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2158774733543396, "train/contrastive_loss": 2.6734330654144287, "train/negative_loss": 2.255758047103882, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.41767510771751404, "train/total_loss": 0.7505640983581543 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2009315937757492, "train/contrastive_loss": 2.5592880249023438, "train/negative_loss": 1.6822422742843628, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8770458698272705, "train/total_loss": 0.7127892374992371 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1938031017780304, "train/contrastive_loss": 1.9480438232421875, "train/negative_loss": 1.1423985958099365, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.805645227432251, "train/total_loss": 0.5834118723869324 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.21119935810565948, "train/contrastive_loss": 1.7656980752944946, "train/negative_loss": 1.7656002044677734, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 9.787561430130154e-05, "train/total_loss": 0.5643389821052551 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.10881562530994415, "train/contrastive_loss": 0.5218908190727234, "train/negative_loss": 0.2153853327035904, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.3065054714679718, "train/total_loss": 0.21319378912448883 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.21974939107894897, "train/contrastive_loss": 2.9008002281188965, "train/negative_loss": 1.8823362588882446, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.0184640884399414, "train/total_loss": 0.7999094724655151 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.15743964910507202, "train/contrastive_loss": 1.6973141431808472, "train/negative_loss": 0.9312524199485779, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.7660617232322693, "train/total_loss": 0.4969024956226349 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18000084161758423, "train/contrastive_loss": 2.4370360374450684, "train/negative_loss": 1.3035897016525269, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.133446455001831, "train/total_loss": 0.6674080491065979 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.20252205431461334, "train/contrastive_loss": 4.0921549797058105, "train/negative_loss": 1.9788979291915894, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.1132569313049316, "train/total_loss": 1.0209530591964722 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1931208223104477, "train/contrastive_loss": 0.9694631695747375, "train/negative_loss": 0.7264527082443237, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.24301044642925262, "train/total_loss": 0.3870134651660919 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.14310020208358765, "train/contrastive_loss": 3.136925220489502, "train/negative_loss": 0.9973586797714233, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.139566421508789, "train/total_loss": 0.7704852819442749 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.17020396888256073, "train/contrastive_loss": 0.86734938621521, "train/negative_loss": 0.6761361956596375, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.19121317565441132, "train/total_loss": 0.34367385506629944 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.12875641882419586, "train/contrastive_loss": 1.9166319370269775, "train/negative_loss": 1.196470856666565, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7201610207557678, "train/total_loss": 0.5120828151702881 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19211642444133759, "train/contrastive_loss": 0.7449772357940674, "train/negative_loss": 0.32287636399269104, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.42210087180137634, "train/total_loss": 0.3411118686199188 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.161703422665596, "train/contrastive_loss": 0.9431514143943787, "train/negative_loss": 0.9366201162338257, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.006531290244311094, "train/total_loss": 0.35033369064331055 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19374893605709076, "train/contrastive_loss": 4.162308692932129, "train/negative_loss": 1.705967903137207, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.4563405513763428, "train/total_loss": 1.0262106657028198 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.14964060485363007, "train/contrastive_loss": 1.930443525314331, "train/negative_loss": 1.869929313659668, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.06051427125930786, "train/total_loss": 0.5357292890548706 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1389130800962448, "train/contrastive_loss": 3.3842926025390625, "train/negative_loss": 2.657822608947754, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7264699935913086, "train/total_loss": 0.8157716393470764 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.17792023718357086, "train/contrastive_loss": 2.513064384460449, "train/negative_loss": 2.0533604621887207, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.45970404148101807, "train/total_loss": 0.6805331110954285 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.23604583740234375, "train/contrastive_loss": 2.593393325805664, "train/negative_loss": 1.6502387523651123, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.9431546926498413, "train/total_loss": 0.7547245025634766 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1863241195678711, "train/contrastive_loss": 2.0253219604492188, "train/negative_loss": 1.1448673009872437, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.8804546594619751, "train/total_loss": 0.5913885235786438 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.21107758581638336, "train/contrastive_loss": 2.7217471599578857, "train/negative_loss": 2.1596999168395996, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5620473027229309, "train/total_loss": 0.7554270029067993 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1976681649684906, "train/contrastive_loss": 1.715854287147522, "train/negative_loss": 1.7118229866027832, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.004031301010400057, "train/total_loss": 0.5408390164375305 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.17681534588336945, "train/contrastive_loss": 0.14368316531181335, "train/negative_loss": 0.13802795112133026, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.005655211862176657, "train/total_loss": 0.20555198192596436 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.27567559480667114, "train/contrastive_loss": 2.819042205810547, "train/negative_loss": 1.5198527574539185, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.2991894483566284, "train/total_loss": 0.8394840359687805 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.20924969017505646, "train/contrastive_loss": 0.3890290856361389, "train/negative_loss": 0.3867047429084778, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0023243350442498922, "train/total_loss": 0.28705549240112305 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.17166674137115479, "train/contrastive_loss": 1.5331645011901855, "train/negative_loss": 1.520494818687439, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.012669644318521023, "train/total_loss": 0.47829964756965637 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.16858166456222534, "train/contrastive_loss": 2.918395757675171, "train/negative_loss": 2.204179048538208, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7142167091369629, "train/total_loss": 0.7522608041763306 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19467951357364655, "train/contrastive_loss": 1.0604459047317505, "train/negative_loss": 0.48637786507606506, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5740680694580078, "train/total_loss": 0.40676867961883545 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.21877193450927734, "train/contrastive_loss": 2.194817304611206, "train/negative_loss": 1.7197083234786987, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.47510895133018494, "train/total_loss": 0.6577354073524475 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.23548386991024017, "train/contrastive_loss": 1.9063204526901245, "train/negative_loss": 1.3938144445419312, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5125060081481934, "train/total_loss": 0.6167479753494263 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.15225757658481598, "train/contrastive_loss": 2.207214832305908, "train/negative_loss": 2.2071568965911865, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 5.7984703744295985e-05, "train/total_loss": 0.5937005281448364 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19602622091770172, "train/contrastive_loss": 0.8796312212944031, "train/negative_loss": 0.6032993793487549, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.2763318419456482, "train/total_loss": 0.37195247411727905 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.24723008275032043, "train/contrastive_loss": 2.630075454711914, "train/negative_loss": 2.3886241912841797, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.24145132303237915, "train/total_loss": 0.7732452154159546 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2137121856212616, "train/contrastive_loss": 0.9918572902679443, "train/negative_loss": 0.474529892206192, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.5173274278640747, "train/total_loss": 0.41208362579345703 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2880937159061432, "train/contrastive_loss": 3.541677236557007, "train/negative_loss": 1.4077179431915283, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.1339592933654785, "train/total_loss": 0.9964292049407959 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.14877694845199585, "train/contrastive_loss": 1.132318139076233, "train/negative_loss": 0.7275153398513794, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.4048027992248535, "train/total_loss": 0.3752405643463135 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18981721997261047, "train/contrastive_loss": 3.654658555984497, "train/negative_loss": 2.8217084407806396, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.8329501748085022, "train/total_loss": 0.9207489490509033 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1946374624967575, "train/contrastive_loss": 1.383418321609497, "train/negative_loss": 1.3825664520263672, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0008519234834238887, "train/total_loss": 0.47132110595703125 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2662365436553955, "train/contrastive_loss": 2.085479259490967, "train/negative_loss": 1.7236754894256592, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.3618038594722748, "train/total_loss": 0.6833324432373047 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18046359717845917, "train/contrastive_loss": 0.5860280990600586, "train/negative_loss": 0.5711997151374817, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.014828408136963844, "train/total_loss": 0.2976692318916321 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.31441617012023926, "train/contrastive_loss": 1.8963901996612549, "train/negative_loss": 1.2531230449676514, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.6432670950889587, "train/total_loss": 0.6936942338943481 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.16098926961421967, "train/contrastive_loss": 2.4503560066223145, "train/negative_loss": 1.1020476818084717, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.3483083248138428, "train/total_loss": 0.6510604619979858 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19906562566757202, "train/contrastive_loss": 2.5203075408935547, "train/negative_loss": 2.0850064754486084, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.43530112504959106, "train/total_loss": 0.7031271457672119 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.24975664913654327, "train/contrastive_loss": 2.529301881790161, "train/negative_loss": 2.529297113418579, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 4.64917320641689e-06, "train/total_loss": 0.7556170225143433 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18246497213840485, "train/contrastive_loss": 2.2353734970092773, "train/negative_loss": 1.3504908084869385, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.8848828077316284, "train/total_loss": 0.6295396685600281 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.13839206099510193, "train/contrastive_loss": 0.48033958673477173, "train/negative_loss": 0.33591514825820923, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.1444244384765625, "train/total_loss": 0.2344599813222885 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2013828158378601, "train/contrastive_loss": 0.923154354095459, "train/negative_loss": 0.8586488962173462, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.064505435526371, "train/total_loss": 0.3860136866569519 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.213034525513649, "train/contrastive_loss": 0.9196885228157043, "train/negative_loss": 0.8416456580162048, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.07804284989833832, "train/total_loss": 0.3969722390174866 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.29486164450645447, "train/contrastive_loss": 1.887904405593872, "train/negative_loss": 1.2852332592010498, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 0.6026711463928223, "train/total_loss": 0.6724425554275513 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1399642378091812, "train/contrastive_loss": 0.5256852507591248, "train/negative_loss": 0.4322962462902069, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.09338901937007904, "train/total_loss": 0.24510128796100616 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.14409293234348297, "train/contrastive_loss": 1.1297039985656738, "train/negative_loss": 0.5489850640296936, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.580718994140625, "train/total_loss": 0.37003374099731445 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1656644195318222, "train/contrastive_loss": 2.506514310836792, "train/negative_loss": 0.6568769812583923, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.8496372699737549, "train/total_loss": 0.6669673323631287 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.21137888729572296, "train/contrastive_loss": 3.516695499420166, "train/negative_loss": 1.73699951171875, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.7796958684921265, "train/total_loss": 0.914717972278595 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.20528481900691986, "train/contrastive_loss": 1.4497418403625488, "train/negative_loss": 0.9157915711402893, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.5339502096176147, "train/total_loss": 0.4952331781387329 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.12146615982055664, "train/contrastive_loss": 0.2809399366378784, "train/negative_loss": 0.27169010043144226, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.009249835275113583, "train/total_loss": 0.17765414714813232 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19084380567073822, "train/contrastive_loss": 1.9817817211151123, "train/negative_loss": 1.3369991779327393, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.644782543182373, "train/total_loss": 0.5872001647949219 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.29518944025039673, "train/contrastive_loss": 2.743422031402588, "train/negative_loss": 2.607961416244507, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.13546055555343628, "train/total_loss": 0.8438738584518433 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.14376363158226013, "train/contrastive_loss": 2.569751739501953, "train/negative_loss": 1.2280256748199463, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.3417261838912964, "train/total_loss": 0.6577140092849731 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.19214600324630737, "train/contrastive_loss": 1.444541335105896, "train/negative_loss": 1.348332166671753, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.09620921313762665, "train/total_loss": 0.48105427622795105 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1902756690979004, "train/contrastive_loss": 2.6923165321350098, "train/negative_loss": 0.8159744143486023, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.8763420581817627, "train/total_loss": 0.7287389636039734 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18975751101970673, "train/contrastive_loss": 4.306968688964844, "train/negative_loss": 4.306966304779053, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.610688852655585e-06, "train/total_loss": 1.0511512756347656 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1805657297372818, "train/contrastive_loss": 1.6494392156600952, "train/negative_loss": 0.5808677673339844, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0685714483261108, "train/total_loss": 0.5104535818099976 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.2143731713294983, "train/contrastive_loss": 2.3271758556365967, "train/negative_loss": 1.2828887701034546, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.044287085533142, "train/total_loss": 0.6798083782196045 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1729976236820221, "train/contrastive_loss": 3.203278064727783, "train/negative_loss": 1.3971877098083496, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.806090235710144, "train/total_loss": 0.8136532306671143 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.26526975631713867, "train/contrastive_loss": 2.9190073013305664, "train/negative_loss": 1.8765313625335693, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.0424760580062866, "train/total_loss": 0.849071204662323 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18941755592823029, "train/contrastive_loss": 0.9748981595039368, "train/negative_loss": 0.9455454349517822, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.0293527040630579, "train/total_loss": 0.3843972086906433 }, { "epoch": 7.394366197183099, "eval_exact_match_accuracy": 0.25044091710758376, "eval_hamming_loss": 0.0724141508455234, "eval_loss": 0.5969284772872925, "eval_macro_f1": 0.2802413726884585, "eval_macro_precision": 0.4537141410850705, "eval_macro_recall": 0.22171561528881892, "eval_micro_f1": 0.48676470588235293, "eval_micro_precision": 0.7843601895734598, "eval_micro_recall": 0.35287846481876334, "eval_runtime": 2.8364, "eval_samples_per_second": 199.904, "eval_steps_per_second": 25.032, "step": 2100 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.1787373572587967, "train/contrastive_loss": 0.47825801372528076, "train/negative_loss": 0.43062078952789307, "train/num_negatives": 30, "train/num_positives": 16, "train/positive_loss": 0.0476372204720974, "train/total_loss": 0.27438896894454956 }, { "epoch": 7.394366197183099, "step": 2100, "train/classification_loss": 0.18938905000686646, "train/contrastive_loss": 1.7803001403808594, "train/negative_loss": 0.7165501713752747, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.06374990940094, "train/total_loss": 0.5454490780830383 }, { "epoch": 7.570422535211268, "grad_norm": 13.924952507019043, "learning_rate": 1.9711627906976747e-05, "loss": 0.7351, "step": 2150 }, { "epoch": 7.570422535211268, "step": 2150, "train/classification_loss": 0.20502950251102448, "train/contrastive_loss": 1.5197179317474365, "train/negative_loss": 0.3525352478027344, "train/num_negatives": 40, "train/num_positives": 4, "train/positive_loss": 1.1671826839447021, "train/total_loss": 0.5089731216430664 }, { "epoch": 7.570422535211268, "step": 2150, "train/classification_loss": 0.15141382813453674, "train/contrastive_loss": 0.9218471050262451, "train/negative_loss": 0.7828749418258667, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.1389721930027008, "train/total_loss": 0.3357832431793213 }, { "epoch": 7.746478873239437, "grad_norm": 11.801557540893555, "learning_rate": 1.9704580690627205e-05, "loss": 0.7747, "step": 2200 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.233855739235878, "train/contrastive_loss": 2.255545139312744, "train/negative_loss": 1.3012739419937134, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.954271137714386, "train/total_loss": 0.6849647760391235 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.26522618532180786, "train/contrastive_loss": 1.7616727352142334, "train/negative_loss": 0.7065722942352295, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.055100440979004, "train/total_loss": 0.6175607442855835 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.25880903005599976, "train/contrastive_loss": 3.44437837600708, "train/negative_loss": 1.8525596857070923, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.5918185710906982, "train/total_loss": 0.9476847052574158 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.12664580345153809, "train/contrastive_loss": 0.6547762751579285, "train/negative_loss": 0.6209471225738525, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.03382916375994682, "train/total_loss": 0.2576010823249817 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2125016748905182, "train/contrastive_loss": 2.5967750549316406, "train/negative_loss": 2.051178455352783, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.5455965995788574, "train/total_loss": 0.7318567037582397 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.19362123310565948, "train/contrastive_loss": 2.632143259048462, "train/negative_loss": 1.5997766256332397, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.0323666334152222, "train/total_loss": 0.7200498580932617 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20858298242092133, "train/contrastive_loss": 1.524407982826233, "train/negative_loss": 1.1166682243347168, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.4077397286891937, "train/total_loss": 0.5134645700454712 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.21285325288772583, "train/contrastive_loss": 1.9451953172683716, "train/negative_loss": 1.9451572895050049, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 3.802848732448183e-05, "train/total_loss": 0.601892352104187 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1049819067120552, "train/contrastive_loss": 0.36691170930862427, "train/negative_loss": 0.3426990211009979, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.024212701246142387, "train/total_loss": 0.17836424708366394 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1960151195526123, "train/contrastive_loss": 2.0619232654571533, "train/negative_loss": 0.9810680747032166, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.0808552503585815, "train/total_loss": 0.6083997488021851 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.15617330372333527, "train/contrastive_loss": 1.9075117111206055, "train/negative_loss": 0.790858805179596, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.1166529655456543, "train/total_loss": 0.537675678730011 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1824103146791458, "train/contrastive_loss": 3.035715103149414, "train/negative_loss": 1.5830165147781372, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.4526987075805664, "train/total_loss": 0.7895533442497253 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20614732801914215, "train/contrastive_loss": 3.8229174613952637, "train/negative_loss": 1.84385085105896, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.9790666103363037, "train/total_loss": 0.9707308411598206 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.17775031924247742, "train/contrastive_loss": 1.8375892639160156, "train/negative_loss": 1.0210528373718262, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.8165364861488342, "train/total_loss": 0.545268177986145 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.14816974103450775, "train/contrastive_loss": 2.6717758178710938, "train/negative_loss": 0.7289735674858093, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.9428021907806396, "train/total_loss": 0.6825249195098877 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16398699581623077, "train/contrastive_loss": 0.9612963199615479, "train/negative_loss": 0.48294222354888916, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.4783541262149811, "train/total_loss": 0.3562462627887726 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.13100416958332062, "train/contrastive_loss": 1.0867034196853638, "train/negative_loss": 0.35729482769966125, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7294086217880249, "train/total_loss": 0.3483448624610901 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20591473579406738, "train/contrastive_loss": 1.6879944801330566, "train/negative_loss": 0.47784149646759033, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.2101529836654663, "train/total_loss": 0.5435136556625366 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.15839135646820068, "train/contrastive_loss": 0.7127677202224731, "train/negative_loss": 0.5803985595703125, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.13236914575099945, "train/total_loss": 0.3009449243545532 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.19651007652282715, "train/contrastive_loss": 3.902580738067627, "train/negative_loss": 1.6494033336639404, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.2531774044036865, "train/total_loss": 0.9770262241363525 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.15365880727767944, "train/contrastive_loss": 2.353194236755371, "train/negative_loss": 2.1736857891082764, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.17950856685638428, "train/total_loss": 0.6242976188659668 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.12539084255695343, "train/contrastive_loss": 2.483067035675049, "train/negative_loss": 1.8802618980407715, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6028050184249878, "train/total_loss": 0.6220042705535889 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.17275339365005493, "train/contrastive_loss": 2.908426523208618, "train/negative_loss": 1.844923973083496, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.063502550125122, "train/total_loss": 0.7544386982917786 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2464851438999176, "train/contrastive_loss": 2.5663833618164062, "train/negative_loss": 1.0961732864379883, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.470210075378418, "train/total_loss": 0.7597618103027344 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.19305849075317383, "train/contrastive_loss": 3.053581476211548, "train/negative_loss": 0.7467369437217712, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 2.306844472885132, "train/total_loss": 0.8037747740745544 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2186601161956787, "train/contrastive_loss": 3.229010820388794, "train/negative_loss": 2.1998815536499023, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0291292667388916, "train/total_loss": 0.8644623160362244 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.19897770881652832, "train/contrastive_loss": 1.5801575183868408, "train/negative_loss": 1.565502643585205, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.014654901809990406, "train/total_loss": 0.5150092244148254 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.17531105875968933, "train/contrastive_loss": 0.21678856015205383, "train/negative_loss": 0.20787391066551208, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.008914647623896599, "train/total_loss": 0.21866877377033234 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2555426061153412, "train/contrastive_loss": 2.9623093605041504, "train/negative_loss": 1.7703056335449219, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.192003607749939, "train/total_loss": 0.8480044603347778 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2015833854675293, "train/contrastive_loss": 0.5235978960990906, "train/negative_loss": 0.5213149785995483, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.002282913774251938, "train/total_loss": 0.3063029646873474 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16498155891895294, "train/contrastive_loss": 1.116623878479004, "train/negative_loss": 1.1126141548156738, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.004009678494185209, "train/total_loss": 0.38830631971359253 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16207949817180634, "train/contrastive_loss": 2.4319911003112793, "train/negative_loss": 1.3011422157287598, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.130849003791809, "train/total_loss": 0.6484777331352234 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1915922313928604, "train/contrastive_loss": 1.2845745086669922, "train/negative_loss": 0.7174274325370789, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5671471357345581, "train/total_loss": 0.4485071301460266 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.21791309118270874, "train/contrastive_loss": 2.680976629257202, "train/negative_loss": 2.04085111618042, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.6401254534721375, "train/total_loss": 0.7541084289550781 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.22994616627693176, "train/contrastive_loss": 2.007884979248047, "train/negative_loss": 1.3865667581558228, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6213181614875793, "train/total_loss": 0.6315231323242188 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1472579389810562, "train/contrastive_loss": 2.277780294418335, "train/negative_loss": 2.277631998062134, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.00014824021491222084, "train/total_loss": 0.6028140187263489 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.18912053108215332, "train/contrastive_loss": 1.2177939414978027, "train/negative_loss": 0.8141074776649475, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.40368643403053284, "train/total_loss": 0.43267932534217834 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.23758885264396667, "train/contrastive_loss": 2.508648157119751, "train/negative_loss": 2.180753469467163, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3278946280479431, "train/total_loss": 0.7393184900283813 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20018039643764496, "train/contrastive_loss": 1.1913447380065918, "train/negative_loss": 0.5931902527809143, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.5981545448303223, "train/total_loss": 0.43844935297966003 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2322784960269928, "train/contrastive_loss": 4.559499740600586, "train/negative_loss": 1.970737338066101, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.5887622833251953, "train/total_loss": 1.1441785097122192 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.14572544395923615, "train/contrastive_loss": 1.8016914129257202, "train/negative_loss": 0.6206285953521729, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.1810628175735474, "train/total_loss": 0.5060637593269348 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20211629569530487, "train/contrastive_loss": 3.5900676250457764, "train/negative_loss": 1.8990634679794312, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.6910041570663452, "train/total_loss": 0.9201298356056213 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.17881852388381958, "train/contrastive_loss": 1.219581961631775, "train/negative_loss": 1.2170060873031616, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0025759157724678516, "train/total_loss": 0.42273491621017456 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.24955160915851593, "train/contrastive_loss": 1.1467219591140747, "train/negative_loss": 1.0726075172424316, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.07411445677280426, "train/total_loss": 0.47889602184295654 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.17249681055545807, "train/contrastive_loss": 0.6076031923294067, "train/negative_loss": 0.5369259715080261, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.07067721337080002, "train/total_loss": 0.2940174341201782 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.32010331749916077, "train/contrastive_loss": 2.603621244430542, "train/negative_loss": 1.6959607601165771, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.9076604843139648, "train/total_loss": 0.8408275842666626 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16025418043136597, "train/contrastive_loss": 1.9934375286102295, "train/negative_loss": 1.0865634679794312, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9068740606307983, "train/total_loss": 0.5589417219161987 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.19057223200798035, "train/contrastive_loss": 2.7621850967407227, "train/negative_loss": 2.4370157718658447, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3251693844795227, "train/total_loss": 0.7430092096328735 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.24548520147800446, "train/contrastive_loss": 2.1916701793670654, "train/negative_loss": 2.191657543182373, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.2517053619376384e-05, "train/total_loss": 0.6838192343711853 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1856653392314911, "train/contrastive_loss": 2.384842872619629, "train/negative_loss": 1.2399189472198486, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.1449238061904907, "train/total_loss": 0.6626338958740234 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.14005175232887268, "train/contrastive_loss": 0.5830338001251221, "train/negative_loss": 0.20902292430400848, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.3740108907222748, "train/total_loss": 0.25665852427482605 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20500682294368744, "train/contrastive_loss": 0.9195634126663208, "train/negative_loss": 0.9051429033279419, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.014420506544411182, "train/total_loss": 0.38891950249671936 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.20003816485404968, "train/contrastive_loss": 1.102660894393921, "train/negative_loss": 0.8248953819274902, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.27776557207107544, "train/total_loss": 0.42057034373283386 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.30356451869010925, "train/contrastive_loss": 3.1805849075317383, "train/negative_loss": 1.5772780179977417, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.603306770324707, "train/total_loss": 0.9396815299987793 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.13979889452457428, "train/contrastive_loss": 0.9882224798202515, "train/negative_loss": 0.35013994574546814, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.6380825042724609, "train/total_loss": 0.33744341135025024 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1323823183774948, "train/contrastive_loss": 0.7261881232261658, "train/negative_loss": 0.29895681142807007, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.4272313117980957, "train/total_loss": 0.27761995792388916 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16428159177303314, "train/contrastive_loss": 2.120096206665039, "train/negative_loss": 0.7873652577400208, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.3327308893203735, "train/total_loss": 0.5883008241653442 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2014031857252121, "train/contrastive_loss": 2.4253745079040527, "train/negative_loss": 1.2768518924713135, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.1485224962234497, "train/total_loss": 0.6864780783653259 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.2026602178812027, "train/contrastive_loss": 0.9674946665763855, "train/negative_loss": 0.6935701966285706, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.27392446994781494, "train/total_loss": 0.39615917205810547 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.1142815425992012, "train/contrastive_loss": 0.11571035534143448, "train/negative_loss": 0.10615988075733185, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.00955047644674778, "train/total_loss": 0.13742361962795258 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.18858285248279572, "train/contrastive_loss": 2.473759412765503, "train/negative_loss": 1.0796419382095337, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.3941174745559692, "train/total_loss": 0.6833347678184509 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.24107052385807037, "train/contrastive_loss": 2.9323906898498535, "train/negative_loss": 1.4752857685089111, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 1.4571049213409424, "train/total_loss": 0.8275486826896667 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.14782081544399261, "train/contrastive_loss": 2.7027158737182617, "train/negative_loss": 1.2966796159744263, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.406036376953125, "train/total_loss": 0.6883640289306641 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.18904618918895721, "train/contrastive_loss": 1.1094850301742554, "train/negative_loss": 0.8641249537467957, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.24536004662513733, "train/total_loss": 0.4109432101249695 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.19876940548419952, "train/contrastive_loss": 2.6384170055389404, "train/negative_loss": 1.0102717876434326, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.6281452178955078, "train/total_loss": 0.7264528274536133 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.171685129404068, "train/contrastive_loss": 3.6967501640319824, "train/negative_loss": 3.696747303009033, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.849109705493902e-06, "train/total_loss": 0.9110351800918579 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.18085412681102753, "train/contrastive_loss": 1.8239394426345825, "train/negative_loss": 0.6054428815841675, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.218496561050415, "train/total_loss": 0.5456420183181763 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.21124012768268585, "train/contrastive_loss": 2.7942728996276855, "train/negative_loss": 1.3598989248275757, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.4343738555908203, "train/total_loss": 0.7700946927070618 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16738319396972656, "train/contrastive_loss": 3.5876283645629883, "train/negative_loss": 1.4816099405288696, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.106018543243408, "train/total_loss": 0.8849088549613953 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.26058894395828247, "train/contrastive_loss": 2.2595388889312744, "train/negative_loss": 1.5896544456481934, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6698843836784363, "train/total_loss": 0.7124967575073242 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.16976019740104675, "train/contrastive_loss": 0.4422369599342346, "train/negative_loss": 0.39408010244369507, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.04815686121582985, "train/total_loss": 0.2582075893878937 }, { "epoch": 7.746478873239437, "eval_exact_match_accuracy": 0.27336860670194, "eval_hamming_loss": 0.0706504824151883, "eval_loss": 0.598036527633667, "eval_macro_f1": 0.31422932723861985, "eval_macro_precision": 0.5684405947030052, "eval_macro_recall": 0.24597270648439978, "eval_micro_f1": 0.5047272727272727, "eval_micro_precision": 0.7940503432494279, "eval_micro_recall": 0.3699360341151386, "eval_runtime": 2.842, "eval_samples_per_second": 199.507, "eval_steps_per_second": 24.982, "step": 2200 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.12398000061511993, "train/contrastive_loss": 1.5109673738479614, "train/negative_loss": 0.7682982087135315, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7426691651344299, "train/total_loss": 0.42617350816726685 }, { "epoch": 7.746478873239437, "step": 2200, "train/classification_loss": 0.220085009932518, "train/contrastive_loss": 2.30934476852417, "train/negative_loss": 0.9126915335655212, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3966532945632935, "train/total_loss": 0.6819539666175842 }, { "epoch": 7.922535211267606, "grad_norm": 21.52375602722168, "learning_rate": 1.969753347427766e-05, "loss": 0.7352, "step": 2250 }, { "epoch": 7.922535211267606, "step": 2250, "train/classification_loss": 0.1502661257982254, "train/contrastive_loss": 0.4690514802932739, "train/negative_loss": 0.36362096667289734, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.10543051362037659, "train/total_loss": 0.2440764307975769 }, { "epoch": 7.922535211267606, "step": 2250, "train/classification_loss": 0.14285258948802948, "train/contrastive_loss": 0.36563462018966675, "train/negative_loss": 0.35940900444984436, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.00622561713680625, "train/total_loss": 0.21597951650619507 }, { "epoch": 8.098591549295774, "grad_norm": 6.245151519775391, "learning_rate": 1.969048625792812e-05, "loss": 0.6935, "step": 2300 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2442706674337387, "train/contrastive_loss": 2.3785529136657715, "train/negative_loss": 1.3433853387832642, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0351674556732178, "train/total_loss": 0.7199812531471252 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2727251350879669, "train/contrastive_loss": 1.3389389514923096, "train/negative_loss": 0.6907218098640442, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6482172012329102, "train/total_loss": 0.5405129194259644 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.25447356700897217, "train/contrastive_loss": 2.2609119415283203, "train/negative_loss": 1.1106691360473633, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.1502426862716675, "train/total_loss": 0.7066559791564941 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1366354376077652, "train/contrastive_loss": 2.00216007232666, "train/negative_loss": 1.5390781164169312, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.46308207511901855, "train/total_loss": 0.5370674729347229 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.19932346045970917, "train/contrastive_loss": 2.6040477752685547, "train/negative_loss": 2.457207679748535, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.14684009552001953, "train/total_loss": 0.7201330661773682 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.20630595088005066, "train/contrastive_loss": 2.2803642749786377, "train/negative_loss": 1.6419827938079834, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.6383814215660095, "train/total_loss": 0.6623787879943848 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18988202512264252, "train/contrastive_loss": 1.6799254417419434, "train/negative_loss": 0.996150016784668, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.6837754845619202, "train/total_loss": 0.5258671045303345 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.218847393989563, "train/contrastive_loss": 1.7794795036315918, "train/negative_loss": 1.7788747549057007, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00060469307936728, "train/total_loss": 0.5747432708740234 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.10503634065389633, "train/contrastive_loss": 0.46098262071609497, "train/negative_loss": 0.3858431279659271, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.07513950765132904, "train/total_loss": 0.19723287224769592 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18408505618572235, "train/contrastive_loss": 1.5874762535095215, "train/negative_loss": 1.101678729057312, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.48579755425453186, "train/total_loss": 0.5015802979469299 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1481398195028305, "train/contrastive_loss": 1.0276883840560913, "train/negative_loss": 0.9641227722167969, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.06356561928987503, "train/total_loss": 0.35367751121520996 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18674065172672272, "train/contrastive_loss": 1.9973684549331665, "train/negative_loss": 1.9967641830444336, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0006042941240593791, "train/total_loss": 0.5862143635749817 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.21244896948337555, "train/contrastive_loss": 3.3329052925109863, "train/negative_loss": 2.1440296173095703, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1888757944107056, "train/total_loss": 0.8790300488471985 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1680147498846054, "train/contrastive_loss": 0.9330901503562927, "train/negative_loss": 0.8515809178352356, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.08150923997163773, "train/total_loss": 0.35463279485702515 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.13100989162921906, "train/contrastive_loss": 2.4437777996063232, "train/negative_loss": 0.763271152973175, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.680506706237793, "train/total_loss": 0.6197654604911804 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.16607040166854858, "train/contrastive_loss": 1.2120912075042725, "train/negative_loss": 0.7495582103729248, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.46253302693367004, "train/total_loss": 0.4084886312484741 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.12100114673376083, "train/contrastive_loss": 1.183854579925537, "train/negative_loss": 0.6361507177352905, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5477039217948914, "train/total_loss": 0.3577720522880554 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18046681582927704, "train/contrastive_loss": 0.9073315858840942, "train/negative_loss": 0.5911673307418823, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.3161642849445343, "train/total_loss": 0.3619331419467926 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1572113335132599, "train/contrastive_loss": 0.7504340410232544, "train/negative_loss": 0.7349439859390259, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.015490069054067135, "train/total_loss": 0.30729812383651733 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.20097024738788605, "train/contrastive_loss": 3.7277727127075195, "train/negative_loss": 1.5457643270492554, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.1820082664489746, "train/total_loss": 0.9465247988700867 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.15162619948387146, "train/contrastive_loss": 2.49060320854187, "train/negative_loss": 2.3157835006713867, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.17481963336467743, "train/total_loss": 0.649746835231781 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1228061392903328, "train/contrastive_loss": 2.7641682624816895, "train/negative_loss": 2.17568302154541, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5884852409362793, "train/total_loss": 0.675639808177948 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1735696792602539, "train/contrastive_loss": 2.5100314617156982, "train/negative_loss": 2.0456044673919678, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.4644269347190857, "train/total_loss": 0.6755759716033936 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.24511320888996124, "train/contrastive_loss": 3.0371694564819336, "train/negative_loss": 2.0945348739624023, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.9426344633102417, "train/total_loss": 0.8525471091270447 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1792777180671692, "train/contrastive_loss": 1.6307547092437744, "train/negative_loss": 0.9269121885299683, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.7038425207138062, "train/total_loss": 0.505428671836853 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2391292303800583, "train/contrastive_loss": 3.885842800140381, "train/negative_loss": 3.1626739501953125, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7231688499450684, "train/total_loss": 1.0162978172302246 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.19246800243854523, "train/contrastive_loss": 1.6253114938735962, "train/negative_loss": 1.6245441436767578, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0007673421059735119, "train/total_loss": 0.5175303220748901 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18269632756710052, "train/contrastive_loss": 0.24485749006271362, "train/negative_loss": 0.20135609805583954, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.043501388281583786, "train/total_loss": 0.23166783154010773 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.26650598645210266, "train/contrastive_loss": 2.9885897636413574, "train/negative_loss": 1.6735867261886597, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.3150030374526978, "train/total_loss": 0.8642239570617676 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.20834429562091827, "train/contrastive_loss": 1.2400048971176147, "train/negative_loss": 1.2383698225021362, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0016350996447727084, "train/total_loss": 0.45634526014328003 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1626977175474167, "train/contrastive_loss": 1.3122689723968506, "train/negative_loss": 1.306136965751648, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0061319489032030106, "train/total_loss": 0.425151526927948 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.16451436281204224, "train/contrastive_loss": 2.6817378997802734, "train/negative_loss": 1.554318904876709, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.127418875694275, "train/total_loss": 0.700861930847168 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18853893876075745, "train/contrastive_loss": 1.156378984451294, "train/negative_loss": 0.5881754755973816, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5682035684585571, "train/total_loss": 0.41981473565101624 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.23048639297485352, "train/contrastive_loss": 2.103973865509033, "train/negative_loss": 1.7719988822937012, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.3319750726222992, "train/total_loss": 0.6512811779975891 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.24674762785434723, "train/contrastive_loss": 1.657181739807129, "train/negative_loss": 1.3021827936172485, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.35499894618988037, "train/total_loss": 0.5781840085983276 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.14322857558727264, "train/contrastive_loss": 2.511337995529175, "train/negative_loss": 2.511237144470215, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.00010087047121487558, "train/total_loss": 0.6454961895942688 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2110125571489334, "train/contrastive_loss": 1.54874587059021, "train/negative_loss": 0.8461430668830872, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.702602744102478, "train/total_loss": 0.5207617282867432 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2378484010696411, "train/contrastive_loss": 1.8977556228637695, "train/negative_loss": 1.5594482421875, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.33830738067626953, "train/total_loss": 0.6173995733261108 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.20430578291416168, "train/contrastive_loss": 0.7996668219566345, "train/negative_loss": 0.3860071003437042, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.4136597216129303, "train/total_loss": 0.3642391562461853 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2435009628534317, "train/contrastive_loss": 3.9582719802856445, "train/negative_loss": 1.2625460624694824, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.695725917816162, "train/total_loss": 1.0351554155349731 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.14390785992145538, "train/contrastive_loss": 1.3989417552947998, "train/negative_loss": 0.8301483988761902, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.5687934160232544, "train/total_loss": 0.42369621992111206 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.16942669451236725, "train/contrastive_loss": 2.480360507965088, "train/negative_loss": 1.3820008039474487, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.0983595848083496, "train/total_loss": 0.6654987931251526 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.17368774116039276, "train/contrastive_loss": 0.5367939472198486, "train/negative_loss": 0.5365847945213318, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00020916196808684617, "train/total_loss": 0.2810465395450592 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2790934145450592, "train/contrastive_loss": 1.247010350227356, "train/negative_loss": 1.0117290019989014, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.23528137803077698, "train/total_loss": 0.5284954905509949 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.17889797687530518, "train/contrastive_loss": 0.9467892646789551, "train/negative_loss": 0.9327142834663391, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.014075009152293205, "train/total_loss": 0.3682558536529541 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.32379627227783203, "train/contrastive_loss": 2.387416362762451, "train/negative_loss": 1.2085150480270386, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.1789014339447021, "train/total_loss": 0.8012795448303223 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1566537767648697, "train/contrastive_loss": 1.6297328472137451, "train/negative_loss": 1.0654380321502686, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5642948150634766, "train/total_loss": 0.4826003313064575 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2062344253063202, "train/contrastive_loss": 3.2087810039520264, "train/negative_loss": 2.774134397506714, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4346466660499573, "train/total_loss": 0.8479906320571899 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.22560301423072815, "train/contrastive_loss": 2.996796131134033, "train/negative_loss": 2.996795177459717, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 9.536747711536009e-07, "train/total_loss": 0.8249622583389282 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1849716305732727, "train/contrastive_loss": 2.3432679176330566, "train/negative_loss": 1.2241214513778687, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.1191463470458984, "train/total_loss": 0.6536252498626709 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.12908166646957397, "train/contrastive_loss": 0.1698368489742279, "train/negative_loss": 0.10628936439752579, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.06354749202728271, "train/total_loss": 0.16304904222488403 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18918542563915253, "train/contrastive_loss": 0.9553216695785522, "train/negative_loss": 0.9142136573791504, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.041108034551143646, "train/total_loss": 0.3802497684955597 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2061411440372467, "train/contrastive_loss": 1.1246836185455322, "train/negative_loss": 1.087032675743103, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.037650998681783676, "train/total_loss": 0.43107786774635315 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.29631879925727844, "train/contrastive_loss": 2.7426772117614746, "train/negative_loss": 1.6752409934997559, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.0674362182617188, "train/total_loss": 0.8448542356491089 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.13911233842372894, "train/contrastive_loss": 0.5739650726318359, "train/negative_loss": 0.3104524314403534, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.26351261138916016, "train/total_loss": 0.25390535593032837 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.12644430994987488, "train/contrastive_loss": 0.8025156259536743, "train/negative_loss": 0.2920730710029602, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.5104425549507141, "train/total_loss": 0.28694742918014526 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1651710867881775, "train/contrastive_loss": 1.9835624694824219, "train/negative_loss": 0.7725695371627808, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.2109929323196411, "train/total_loss": 0.5618835687637329 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2049207091331482, "train/contrastive_loss": 2.5237317085266113, "train/negative_loss": 0.8629840612411499, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.6607476472854614, "train/total_loss": 0.7096670866012573 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18920323252677917, "train/contrastive_loss": 1.006458044052124, "train/negative_loss": 0.6816026568412781, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.32485535740852356, "train/total_loss": 0.39049482345581055 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.11797206848859787, "train/contrastive_loss": 0.553642213344574, "train/negative_loss": 0.5504075884819031, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0032346013467758894, "train/total_loss": 0.22870051860809326 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.18942297995090485, "train/contrastive_loss": 2.5242488384246826, "train/negative_loss": 1.4783424139022827, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.0459064245224, "train/total_loss": 0.6942727565765381 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2820577621459961, "train/contrastive_loss": 2.3094828128814697, "train/negative_loss": 2.0089049339294434, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.30057796835899353, "train/total_loss": 0.7439543008804321 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.13928921520709991, "train/contrastive_loss": 2.8141512870788574, "train/negative_loss": 1.2586567401885986, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.5554946660995483, "train/total_loss": 0.7021194696426392 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.17805629968643188, "train/contrastive_loss": 1.3132739067077637, "train/negative_loss": 0.9032646417617798, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.4100092053413391, "train/total_loss": 0.4407110810279846 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1912367194890976, "train/contrastive_loss": 2.892659902572632, "train/negative_loss": 0.8198800683021545, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 2.072779893875122, "train/total_loss": 0.7697687149047852 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1900109350681305, "train/contrastive_loss": 6.243737697601318, "train/negative_loss": 6.243734836578369, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.8491119792306563e-06, "train/total_loss": 1.4387584924697876 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.1916729211807251, "train/contrastive_loss": 2.114192485809326, "train/negative_loss": 0.4543111324310303, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.6598812341690063, "train/total_loss": 0.6145114302635193 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.23355406522750854, "train/contrastive_loss": 3.058589458465576, "train/negative_loss": 1.378065824508667, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.6805236339569092, "train/total_loss": 0.8452719449996948 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.16609349846839905, "train/contrastive_loss": 2.6771068572998047, "train/negative_loss": 1.1652591228485107, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.511847734451294, "train/total_loss": 0.7015148401260376 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.2662345767021179, "train/contrastive_loss": 2.5414786338806152, "train/negative_loss": 2.198185443878174, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.34329307079315186, "train/total_loss": 0.774530291557312 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.16836853325366974, "train/contrastive_loss": 0.46617648005485535, "train/negative_loss": 0.4631706476211548, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.0030058410484343767, "train/total_loss": 0.26160383224487305 }, { "epoch": 8.098591549295774, "eval_exact_match_accuracy": 0.2821869488536155, "eval_hamming_loss": 0.07116920842411038, "eval_loss": 0.5833853483200073, "eval_macro_f1": 0.3069332640464957, "eval_macro_precision": 0.48224143083602977, "eval_macro_recall": 0.2493488712169924, "eval_micro_f1": 0.5134751773049645, "eval_micro_precision": 0.7669491525423728, "eval_micro_recall": 0.3859275053304904, "eval_runtime": 2.845, "eval_samples_per_second": 199.297, "eval_steps_per_second": 24.956, "step": 2300 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.10601180046796799, "train/contrastive_loss": 0.4751158058643341, "train/negative_loss": 0.4748990535736084, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.00021674255549442023, "train/total_loss": 0.20103496313095093 }, { "epoch": 8.098591549295774, "step": 2300, "train/classification_loss": 0.17395861446857452, "train/contrastive_loss": 0.9130652546882629, "train/negative_loss": 0.4688066840171814, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.44425857067108154, "train/total_loss": 0.35657167434692383 }, { "epoch": 8.274647887323944, "grad_norm": 18.140853881835938, "learning_rate": 1.968343904157858e-05, "loss": 0.7399, "step": 2350 }, { "epoch": 8.274647887323944, "step": 2350, "train/classification_loss": 0.14559383690357208, "train/contrastive_loss": 1.428407073020935, "train/negative_loss": 0.6315807104110718, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7968263626098633, "train/total_loss": 0.43127524852752686 }, { "epoch": 8.274647887323944, "step": 2350, "train/classification_loss": 0.23761597275733948, "train/contrastive_loss": 0.7272334694862366, "train/negative_loss": 0.7253899574279785, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.0018435402307659388, "train/total_loss": 0.3830626606941223 }, { "epoch": 8.450704225352112, "grad_norm": 13.615300178527832, "learning_rate": 1.9676391825229034e-05, "loss": 0.7359, "step": 2400 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2449459731578827, "train/contrastive_loss": 2.094484567642212, "train/negative_loss": 1.164997935295105, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9294866323471069, "train/total_loss": 0.6638429164886475 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2569793164730072, "train/contrastive_loss": 1.2955036163330078, "train/negative_loss": 0.8844051361083984, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.4110984206199646, "train/total_loss": 0.5160800218582153 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2583286762237549, "train/contrastive_loss": 2.991950035095215, "train/negative_loss": 1.8696959018707275, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.1222542524337769, "train/total_loss": 0.8567187190055847 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.14321866631507874, "train/contrastive_loss": 1.5693767070770264, "train/negative_loss": 1.141835331916809, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4275414049625397, "train/total_loss": 0.4570940136909485 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.20901921391487122, "train/contrastive_loss": 2.5436007976531982, "train/negative_loss": 2.3255441188812256, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.21805673837661743, "train/total_loss": 0.7177393436431885 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.20494309067726135, "train/contrastive_loss": 2.2672677040100098, "train/negative_loss": 1.3010964393615723, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.966171383857727, "train/total_loss": 0.6583966016769409 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.18722404539585114, "train/contrastive_loss": 1.4128552675247192, "train/negative_loss": 0.8419068455696106, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.5709484219551086, "train/total_loss": 0.4697951078414917 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1948729008436203, "train/contrastive_loss": 1.3329535722732544, "train/negative_loss": 1.3328713178634644, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 8.225779311032966e-05, "train/total_loss": 0.4614636301994324 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.10457542538642883, "train/contrastive_loss": 0.5528663396835327, "train/negative_loss": 0.35733428597450256, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.19553205370903015, "train/total_loss": 0.2151486873626709 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.168312206864357, "train/contrastive_loss": 1.2611491680145264, "train/negative_loss": 0.9446191191673279, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.3165300786495209, "train/total_loss": 0.42054206132888794 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.15372414886951447, "train/contrastive_loss": 1.440199613571167, "train/negative_loss": 0.7387551665306091, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.7014443874359131, "train/total_loss": 0.44176405668258667 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.17469422519207, "train/contrastive_loss": 2.0290565490722656, "train/negative_loss": 2.0175931453704834, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.011463319882750511, "train/total_loss": 0.5805055499076843 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.20461958646774292, "train/contrastive_loss": 3.3113276958465576, "train/negative_loss": 1.6892004013061523, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.6221272945404053, "train/total_loss": 0.8668851256370544 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16668808460235596, "train/contrastive_loss": 1.0202604532241821, "train/negative_loss": 0.8316395878791809, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.18862083554267883, "train/total_loss": 0.3707401752471924 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1361311972141266, "train/contrastive_loss": 2.1061978340148926, "train/negative_loss": 0.8262069225311279, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.2799909114837646, "train/total_loss": 0.5573707818984985 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.15822388231754303, "train/contrastive_loss": 1.2653664350509644, "train/negative_loss": 0.40365445613861084, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8617119789123535, "train/total_loss": 0.4112972021102905 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1280098557472229, "train/contrastive_loss": 1.095563530921936, "train/negative_loss": 0.45390164852142334, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6416618824005127, "train/total_loss": 0.34712255001068115 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.18794164061546326, "train/contrastive_loss": 0.4926373064517975, "train/negative_loss": 0.2894083559513092, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.20322895050048828, "train/total_loss": 0.28646910190582275 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.14979209005832672, "train/contrastive_loss": 0.8436325192451477, "train/negative_loss": 0.5042153000831604, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.3394172191619873, "train/total_loss": 0.31851857900619507 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19912217557430267, "train/contrastive_loss": 2.5443177223205566, "train/negative_loss": 1.503640055656433, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.040677547454834, "train/total_loss": 0.7079857587814331 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16029615700244904, "train/contrastive_loss": 2.637667655944824, "train/negative_loss": 2.5243072509765625, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.11336030811071396, "train/total_loss": 0.6878296732902527 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.12428630143404007, "train/contrastive_loss": 2.6403861045837402, "train/negative_loss": 2.0968854427337646, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5435007214546204, "train/total_loss": 0.6523635387420654 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16106870770454407, "train/contrastive_loss": 3.2484290599823, "train/negative_loss": 1.6945791244506836, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.5538499355316162, "train/total_loss": 0.8107545375823975 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2549956738948822, "train/contrastive_loss": 3.269454002380371, "train/negative_loss": 1.4515544176101685, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.8178997039794922, "train/total_loss": 0.9088864326477051 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.18278349936008453, "train/contrastive_loss": 2.224982976913452, "train/negative_loss": 0.7934094667434692, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.431573510169983, "train/total_loss": 0.6277800798416138 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2195686250925064, "train/contrastive_loss": 3.277425527572632, "train/negative_loss": 2.4933409690856934, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7840845584869385, "train/total_loss": 0.8750537037849426 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19263122975826263, "train/contrastive_loss": 1.8158292770385742, "train/negative_loss": 1.8146997690200806, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0011294549331068993, "train/total_loss": 0.5557971000671387 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16757798194885254, "train/contrastive_loss": 0.24850153923034668, "train/negative_loss": 0.22848138213157654, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.02002016268670559, "train/total_loss": 0.21727828681468964 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2757203280925751, "train/contrastive_loss": 2.6667003631591797, "train/negative_loss": 1.565339207649231, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.1013610363006592, "train/total_loss": 0.8090604543685913 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19449162483215332, "train/contrastive_loss": 0.5649770498275757, "train/negative_loss": 0.5641927123069763, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0007843284984119236, "train/total_loss": 0.30748704075813293 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1655542105436325, "train/contrastive_loss": 1.4574739933013916, "train/negative_loss": 1.4567549228668213, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0007190585602074862, "train/total_loss": 0.45704901218414307 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16483651101589203, "train/contrastive_loss": 2.407829761505127, "train/negative_loss": 1.40552818775177, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0023016929626465, "train/total_loss": 0.6464024782180786 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.17835907638072968, "train/contrastive_loss": 2.0878913402557373, "train/negative_loss": 1.2990790605545044, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7888123393058777, "train/total_loss": 0.5959373712539673 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2198270857334137, "train/contrastive_loss": 2.829572916030884, "train/negative_loss": 1.9019861221313477, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.9275867938995361, "train/total_loss": 0.7857416868209839 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.23555278778076172, "train/contrastive_loss": 1.746448040008545, "train/negative_loss": 1.2962474822998047, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.450200617313385, "train/total_loss": 0.5848424434661865 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1378675252199173, "train/contrastive_loss": 1.980405569076538, "train/negative_loss": 1.9791914224624634, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.0012141054030507803, "train/total_loss": 0.5339486598968506 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.20216575264930725, "train/contrastive_loss": 1.2747738361358643, "train/negative_loss": 0.6447005867958069, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.6300731897354126, "train/total_loss": 0.45712053775787354 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.23815526068210602, "train/contrastive_loss": 3.062293291091919, "train/negative_loss": 2.53509783744812, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.5271954536437988, "train/total_loss": 0.8506138920783997 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.20140235126018524, "train/contrastive_loss": 1.0562694072723389, "train/negative_loss": 0.7323762774467468, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.32389307022094727, "train/total_loss": 0.4126562476158142 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2705965042114258, "train/contrastive_loss": 3.890573024749756, "train/negative_loss": 2.1461291313171387, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.7444437742233276, "train/total_loss": 1.0487110614776611 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.14587567746639252, "train/contrastive_loss": 1.6785633563995361, "train/negative_loss": 0.5967957377433777, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0817675590515137, "train/total_loss": 0.48158836364746094 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1672477424144745, "train/contrastive_loss": 1.8323241472244263, "train/negative_loss": 0.830080509185791, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.0022436380386353, "train/total_loss": 0.5337125658988953 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1621384620666504, "train/contrastive_loss": 0.747734010219574, "train/negative_loss": 0.747294008731842, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0004400020989123732, "train/total_loss": 0.3116852641105652 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.24401827156543732, "train/contrastive_loss": 1.2871679067611694, "train/negative_loss": 1.1827905178070068, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.104377381503582, "train/total_loss": 0.501451849937439 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16784295439720154, "train/contrastive_loss": 0.9098984003067017, "train/negative_loss": 0.9028022885322571, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.007096088957041502, "train/total_loss": 0.34982264041900635 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.3237954378128052, "train/contrastive_loss": 2.385223388671875, "train/negative_loss": 1.2870439291000366, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.098179578781128, "train/total_loss": 0.8008401393890381 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.14544318616390228, "train/contrastive_loss": 2.0616774559020996, "train/negative_loss": 1.0446054935455322, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0170719623565674, "train/total_loss": 0.5577786564826965 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.17914167046546936, "train/contrastive_loss": 2.7266931533813477, "train/negative_loss": 2.359682083129883, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3670111894607544, "train/total_loss": 0.7244802713394165 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2335483431816101, "train/contrastive_loss": 2.696150302886963, "train/negative_loss": 2.69614839553833, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.7881409348774469e-06, "train/total_loss": 0.7727783918380737 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19012564420700073, "train/contrastive_loss": 2.4143619537353516, "train/negative_loss": 1.1258702278137207, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.2884916067123413, "train/total_loss": 0.6729980707168579 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.12416550517082214, "train/contrastive_loss": 0.2659369707107544, "train/negative_loss": 0.1255723387002945, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.1403646171092987, "train/total_loss": 0.1773529052734375 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19429625570774078, "train/contrastive_loss": 1.1504722833633423, "train/negative_loss": 0.9434749484062195, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.20699737966060638, "train/total_loss": 0.4243907332420349 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2082436978816986, "train/contrastive_loss": 1.014721155166626, "train/negative_loss": 0.8957695364952087, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.11895164847373962, "train/total_loss": 0.41118794679641724 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.29638078808784485, "train/contrastive_loss": 2.539285659790039, "train/negative_loss": 1.3751596212387085, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.1641261577606201, "train/total_loss": 0.804237961769104 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.144293412566185, "train/contrastive_loss": 1.1578879356384277, "train/negative_loss": 0.2715948224067688, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8862931728363037, "train/total_loss": 0.3758710026741028 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1365317702293396, "train/contrastive_loss": 0.9785356521606445, "train/negative_loss": 0.26192107796669006, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.7166145443916321, "train/total_loss": 0.33223891258239746 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.18250741064548492, "train/contrastive_loss": 2.235269069671631, "train/negative_loss": 1.0084832906723022, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.226785659790039, "train/total_loss": 0.6295612454414368 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19683633744716644, "train/contrastive_loss": 2.222316265106201, "train/negative_loss": 1.7189472913742065, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.5033690333366394, "train/total_loss": 0.6412996053695679 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.19557024538516998, "train/contrastive_loss": 0.8996196985244751, "train/negative_loss": 0.5515589118003845, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.34806081652641296, "train/total_loss": 0.37549418210983276 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.11459163576364517, "train/contrastive_loss": 0.2867501974105835, "train/negative_loss": 0.2779722213745117, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.008777974173426628, "train/total_loss": 0.17194166779518127 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.18750149011611938, "train/contrastive_loss": 2.071375608444214, "train/negative_loss": 1.2362457513809204, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.8351298570632935, "train/total_loss": 0.6017765998840332 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.2722088396549225, "train/contrastive_loss": 3.3038153648376465, "train/negative_loss": 1.9966479539871216, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 1.3071672916412354, "train/total_loss": 0.9329719543457031 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.13532032072544098, "train/contrastive_loss": 2.162440299987793, "train/negative_loss": 1.180728554725647, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.9817118048667908, "train/total_loss": 0.5678083896636963 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.18387490510940552, "train/contrastive_loss": 1.4897825717926025, "train/negative_loss": 0.8728315234184265, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.6169509887695312, "train/total_loss": 0.481831431388855 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1634780913591385, "train/contrastive_loss": 1.4458531141281128, "train/negative_loss": 0.5584594011306763, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.8873937129974365, "train/total_loss": 0.45264869928359985 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1681169867515564, "train/contrastive_loss": 4.320793151855469, "train/negative_loss": 4.320789813995361, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 3.218665369786322e-06, "train/total_loss": 1.032275676727295 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.17943213880062103, "train/contrastive_loss": 1.8562180995941162, "train/negative_loss": 0.84536212682724, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.010856032371521, "train/total_loss": 0.5506757497787476 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.20423956215381622, "train/contrastive_loss": 2.25396728515625, "train/negative_loss": 1.5905145406723022, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6634528040885925, "train/total_loss": 0.6550330519676208 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.1618092656135559, "train/contrastive_loss": 2.6421542167663574, "train/negative_loss": 0.9217068552970886, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.7204474210739136, "train/total_loss": 0.6902401447296143 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.25699126720428467, "train/contrastive_loss": 1.65337336063385, "train/negative_loss": 1.4641841650009155, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.18918918073177338, "train/total_loss": 0.5876659154891968 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.16687235236167908, "train/contrastive_loss": 0.5587081909179688, "train/negative_loss": 0.48641812801361084, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.07229007035493851, "train/total_loss": 0.27861398458480835 }, { "epoch": 8.450704225352112, "eval_exact_match_accuracy": 0.2874779541446208, "eval_hamming_loss": 0.0682643427741467, "eval_loss": 0.5643488168716431, "eval_macro_f1": 0.3535031028397779, "eval_macro_precision": 0.5754891656934286, "eval_macro_recall": 0.2853629307270238, "eval_micro_f1": 0.5320056899004267, "eval_micro_precision": 0.7991452991452992, "eval_micro_recall": 0.39872068230277186, "eval_runtime": 2.8456, "eval_samples_per_second": 199.255, "eval_steps_per_second": 24.951, "step": 2400 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.14886359870433807, "train/contrastive_loss": 0.9310144782066345, "train/negative_loss": 0.8535827994346619, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.07743166387081146, "train/total_loss": 0.3350664973258972 }, { "epoch": 8.450704225352112, "step": 2400, "train/classification_loss": 0.13936017453670502, "train/contrastive_loss": 0.7120563983917236, "train/negative_loss": 0.6321664452552795, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0798899307847023, "train/total_loss": 0.2817714512348175 }, { "epoch": 8.626760563380282, "grad_norm": 18.51525115966797, "learning_rate": 1.9669344608879495e-05, "loss": 0.7023, "step": 2450 }, { "epoch": 8.626760563380282, "step": 2450, "train/classification_loss": 0.11917033046483994, "train/contrastive_loss": 0.31866520643234253, "train/negative_loss": 0.22773566842079163, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0909295380115509, "train/total_loss": 0.18290337920188904 }, { "epoch": 8.626760563380282, "step": 2450, "train/classification_loss": 0.13346493244171143, "train/contrastive_loss": 0.7950259447097778, "train/negative_loss": 0.5877374410629272, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.20728850364685059, "train/total_loss": 0.29247012734413147 }, { "epoch": 8.80281690140845, "grad_norm": 10.050371170043945, "learning_rate": 1.9662297392529953e-05, "loss": 0.6547, "step": 2500 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.2511644661426544, "train/contrastive_loss": 2.6396262645721436, "train/negative_loss": 1.6967718601226807, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9428543448448181, "train/total_loss": 0.7790896892547607 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.24657103419303894, "train/contrastive_loss": 0.7728821635246277, "train/negative_loss": 0.6604555249214172, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.11242662370204926, "train/total_loss": 0.4011474847793579 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.2421797811985016, "train/contrastive_loss": 2.3896260261535645, "train/negative_loss": 1.2844914197921753, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.1051344871520996, "train/total_loss": 0.720104992389679 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.14494135975837708, "train/contrastive_loss": 1.591440200805664, "train/negative_loss": 1.1758092641830444, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.41563090682029724, "train/total_loss": 0.4632294178009033 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.21130205690860748, "train/contrastive_loss": 2.506287097930908, "train/negative_loss": 2.0280110836029053, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.47827598452568054, "train/total_loss": 0.7125594615936279 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.20617571473121643, "train/contrastive_loss": 1.9634813070297241, "train/negative_loss": 1.2506732940673828, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.7128080129623413, "train/total_loss": 0.5988719463348389 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1936262845993042, "train/contrastive_loss": 2.0033059120178223, "train/negative_loss": 0.8608787059783936, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.1424270868301392, "train/total_loss": 0.5942875146865845 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.19313490390777588, "train/contrastive_loss": 0.7414778470993042, "train/negative_loss": 0.7409564852714539, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.000521378533449024, "train/total_loss": 0.3414304852485657 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1011158898472786, "train/contrastive_loss": 0.35006284713745117, "train/negative_loss": 0.3396986424922943, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.010364211164414883, "train/total_loss": 0.17112845182418823 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.16592451930046082, "train/contrastive_loss": 1.7435455322265625, "train/negative_loss": 1.136543869972229, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.6070016026496887, "train/total_loss": 0.5146336555480957 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1462712585926056, "train/contrastive_loss": 1.435616135597229, "train/negative_loss": 0.5031639933586121, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.9324521422386169, "train/total_loss": 0.43339449167251587 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.18088997900485992, "train/contrastive_loss": 1.6934937238693237, "train/negative_loss": 1.6808782815933228, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.012615488842129707, "train/total_loss": 0.5195887088775635 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.19819100201129913, "train/contrastive_loss": 3.67189359664917, "train/negative_loss": 2.29703950881958, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3748542070388794, "train/total_loss": 0.9325697422027588 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1696241945028305, "train/contrastive_loss": 1.2580044269561768, "train/negative_loss": 0.9411847591400146, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.3168196976184845, "train/total_loss": 0.42122507095336914 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.13428957760334015, "train/contrastive_loss": 2.469491958618164, "train/negative_loss": 0.8042869567871094, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.6652050018310547, "train/total_loss": 0.6281879544258118 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15965595841407776, "train/contrastive_loss": 1.5159543752670288, "train/negative_loss": 0.6359073519706726, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8800470232963562, "train/total_loss": 0.4628468453884125 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.12364625930786133, "train/contrastive_loss": 0.8296409249305725, "train/negative_loss": 0.30147844552993774, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5281624794006348, "train/total_loss": 0.28957444429397583 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.18789976835250854, "train/contrastive_loss": 0.8999439477920532, "train/negative_loss": 0.6030117869377136, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.2969321608543396, "train/total_loss": 0.36788856983184814 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15312260389328003, "train/contrastive_loss": 0.9006112813949585, "train/negative_loss": 0.4755997657775879, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.425011545419693, "train/total_loss": 0.33324486017227173 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.206082284450531, "train/contrastive_loss": 4.2448930740356445, "train/negative_loss": 1.7870343923568726, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.4578585624694824, "train/total_loss": 1.055060863494873 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15332470834255219, "train/contrastive_loss": 2.7012293338775635, "train/negative_loss": 2.311882972717285, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.3893464505672455, "train/total_loss": 0.693570613861084 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1317104548215866, "train/contrastive_loss": 2.714829921722412, "train/negative_loss": 2.0845723152160645, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6302576065063477, "train/total_loss": 0.6746764779090881 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15104888379573822, "train/contrastive_loss": 2.1891095638275146, "train/negative_loss": 1.3497951030731201, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.8393144607543945, "train/total_loss": 0.5888708233833313 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.26691919565200806, "train/contrastive_loss": 3.4873218536376953, "train/negative_loss": 1.592253565788269, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.8950684070587158, "train/total_loss": 0.964383602142334 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.17469654977321625, "train/contrastive_loss": 2.040550947189331, "train/negative_loss": 0.7673336863517761, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.2732173204421997, "train/total_loss": 0.5828067660331726 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.210176020860672, "train/contrastive_loss": 1.7441418170928955, "train/negative_loss": 1.0948737859725952, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.6492680311203003, "train/total_loss": 0.5590044260025024 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.19292020797729492, "train/contrastive_loss": 1.745369791984558, "train/negative_loss": 1.744639277458191, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0007304659811779857, "train/total_loss": 0.5419942140579224 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.16902956366539001, "train/contrastive_loss": 0.20009179413318634, "train/negative_loss": 0.14015941321849823, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.05993238091468811, "train/total_loss": 0.20904792845249176 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.265617698431015, "train/contrastive_loss": 2.663512945175171, "train/negative_loss": 1.1290005445480347, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.5345124006271362, "train/total_loss": 0.7983202934265137 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.18727409839630127, "train/contrastive_loss": 0.918952465057373, "train/negative_loss": 0.9178711771965027, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0010813073022291064, "train/total_loss": 0.37106460332870483 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.16883639991283417, "train/contrastive_loss": 1.177332878112793, "train/negative_loss": 1.0624253749847412, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.11490747332572937, "train/total_loss": 0.4043029844760895 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.16628685593605042, "train/contrastive_loss": 2.399775505065918, "train/negative_loss": 1.6184954643249512, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7812799215316772, "train/total_loss": 0.6462419629096985 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.17768938839435577, "train/contrastive_loss": 1.727698802947998, "train/negative_loss": 0.8660138845443726, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.8616849184036255, "train/total_loss": 0.52322918176651 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.21600525081157684, "train/contrastive_loss": 1.8556184768676758, "train/negative_loss": 1.7665786743164062, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.08903981745243073, "train/total_loss": 0.5871289372444153 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.2321563959121704, "train/contrastive_loss": 2.2539730072021484, "train/negative_loss": 1.6598936319351196, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5940792560577393, "train/total_loss": 0.6829509735107422 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.13460731506347656, "train/contrastive_loss": 2.105048656463623, "train/negative_loss": 2.1049978733062744, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 5.0864673539763317e-05, "train/total_loss": 0.555617094039917 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1841176301240921, "train/contrastive_loss": 0.8083468675613403, "train/negative_loss": 0.3539351522922516, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.45441168546676636, "train/total_loss": 0.345786988735199 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.23715537786483765, "train/contrastive_loss": 2.8935818672180176, "train/negative_loss": 2.5387141704559326, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.35486775636672974, "train/total_loss": 0.8158717751502991 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.20092280209064484, "train/contrastive_loss": 0.7501943707466125, "train/negative_loss": 0.5360543131828308, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.21414004266262054, "train/total_loss": 0.35096168518066406 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.27190569043159485, "train/contrastive_loss": 2.9224958419799805, "train/negative_loss": 2.2097790241241455, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 0.712716817855835, "train/total_loss": 0.8564049005508423 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1484273076057434, "train/contrastive_loss": 1.7271867990493774, "train/negative_loss": 0.7041757106781006, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0230110883712769, "train/total_loss": 0.49386468529701233 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.17107242345809937, "train/contrastive_loss": 2.5170531272888184, "train/negative_loss": 1.2578942775726318, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.2591588497161865, "train/total_loss": 0.674483060836792 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1631156951189041, "train/contrastive_loss": 0.9078551530838013, "train/negative_loss": 0.9074746966362, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00038047906127758324, "train/total_loss": 0.34468674659729004 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.2701141834259033, "train/contrastive_loss": 1.2464015483856201, "train/negative_loss": 1.2143200635910034, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.032081447541713715, "train/total_loss": 0.5193945169448853 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.16154073178768158, "train/contrastive_loss": 1.0530773401260376, "train/negative_loss": 1.0436376333236694, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.009439758025109768, "train/total_loss": 0.37215620279312134 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.33457106351852417, "train/contrastive_loss": 2.454972267150879, "train/negative_loss": 1.4503281116485596, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.0046441555023193, "train/total_loss": 0.8255655169487 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15463872253894806, "train/contrastive_loss": 1.6894177198410034, "train/negative_loss": 0.9045474529266357, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7848702669143677, "train/total_loss": 0.49252229928970337 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1873106211423874, "train/contrastive_loss": 2.148073673248291, "train/negative_loss": 1.8950856924057007, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.2529880404472351, "train/total_loss": 0.6169253587722778 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.25849273800849915, "train/contrastive_loss": 3.0028321743011475, "train/negative_loss": 3.002824306488037, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 7.867844033171423e-06, "train/total_loss": 0.85905921459198 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1882040947675705, "train/contrastive_loss": 2.9411730766296387, "train/negative_loss": 1.4729305505752563, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.4682424068450928, "train/total_loss": 0.7764387130737305 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.12473208457231522, "train/contrastive_loss": 0.3067686855792999, "train/negative_loss": 0.2376350611448288, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.06913362443447113, "train/total_loss": 0.18608582019805908 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.19111350178718567, "train/contrastive_loss": 0.7253856658935547, "train/negative_loss": 0.6835953593254089, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.041790325194597244, "train/total_loss": 0.3361906409263611 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.20824451744556427, "train/contrastive_loss": 1.2593035697937012, "train/negative_loss": 0.9832590818405151, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.2760445475578308, "train/total_loss": 0.4601052403450012 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.29199981689453125, "train/contrastive_loss": 3.435810089111328, "train/negative_loss": 1.1639904975891113, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 2.271819591522217, "train/total_loss": 0.9791618585586548 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.14920663833618164, "train/contrastive_loss": 1.0227805376052856, "train/negative_loss": 0.2172389030456543, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8055416345596313, "train/total_loss": 0.35376274585723877 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1258079558610916, "train/contrastive_loss": 1.0636166334152222, "train/negative_loss": 0.3190959393978119, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.7445207238197327, "train/total_loss": 0.3385312855243683 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.17183078825473785, "train/contrastive_loss": 3.120384693145752, "train/negative_loss": 0.8461884260177612, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.274196147918701, "train/total_loss": 0.795907735824585 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.19278113543987274, "train/contrastive_loss": 1.627281665802002, "train/negative_loss": 0.9829041957855225, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.6443774104118347, "train/total_loss": 0.5182374715805054 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.19485071301460266, "train/contrastive_loss": 0.9677084684371948, "train/negative_loss": 0.7169820666313171, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.2507264316082001, "train/total_loss": 0.3883923888206482 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.12035193294286728, "train/contrastive_loss": 0.5098100304603577, "train/negative_loss": 0.4969024658203125, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.012907564640045166, "train/total_loss": 0.22231394052505493 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.18376772105693817, "train/contrastive_loss": 2.4269652366638184, "train/negative_loss": 1.1219836473464966, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.3049817085266113, "train/total_loss": 0.669160783290863 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.2328861504793167, "train/contrastive_loss": 1.6766852140426636, "train/negative_loss": 1.5928853750228882, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.0837998166680336, "train/total_loss": 0.5682231783866882 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1382860541343689, "train/contrastive_loss": 1.5263104438781738, "train/negative_loss": 0.667002260684967, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.859308123588562, "train/total_loss": 0.44354814291000366 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1886458843946457, "train/contrastive_loss": 1.6759822368621826, "train/negative_loss": 1.0520031452178955, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.6239790916442871, "train/total_loss": 0.5238423347473145 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1672661006450653, "train/contrastive_loss": 2.2461981773376465, "train/negative_loss": 0.5392714738845825, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.7069268226623535, "train/total_loss": 0.6165057420730591 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.17669512331485748, "train/contrastive_loss": 5.6372222900390625, "train/negative_loss": 5.63722038269043, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.8477469438948901e-06, "train/total_loss": 1.3041396141052246 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.1775110512971878, "train/contrastive_loss": 2.8417880535125732, "train/negative_loss": 0.47931107878685, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.3624770641326904, "train/total_loss": 0.7458686828613281 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.21907341480255127, "train/contrastive_loss": 3.106001377105713, "train/negative_loss": 1.3382761478424072, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.7677253484725952, "train/total_loss": 0.8402736783027649 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15186597406864166, "train/contrastive_loss": 1.9121085405349731, "train/negative_loss": 0.9349023103713989, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.9772062301635742, "train/total_loss": 0.534287691116333 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.26104214787483215, "train/contrastive_loss": 2.1074230670928955, "train/negative_loss": 2.0602364540100098, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.047186508774757385, "train/total_loss": 0.6825267672538757 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15953369438648224, "train/contrastive_loss": 0.5105753540992737, "train/negative_loss": 0.5024698972702026, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.008105463348329067, "train/total_loss": 0.2616487741470337 }, { "epoch": 8.80281690140845, "eval_exact_match_accuracy": 0.2874779541446208, "eval_hamming_loss": 0.06805685237057786, "eval_loss": 0.5672438144683838, "eval_macro_f1": 0.3656328044139099, "eval_macro_precision": 0.5700484562146668, "eval_macro_recall": 0.2988843578849931, "eval_micro_f1": 0.5406162464985994, "eval_micro_precision": 0.7877551020408163, "eval_micro_recall": 0.4115138592750533, "eval_runtime": 2.8461, "eval_samples_per_second": 199.217, "eval_steps_per_second": 24.946, "step": 2500 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.09683547914028168, "train/contrastive_loss": 0.24993473291397095, "train/negative_loss": 0.23617425560951233, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.01376048382371664, "train/total_loss": 0.14682242274284363 }, { "epoch": 8.80281690140845, "step": 2500, "train/classification_loss": 0.15611132979393005, "train/contrastive_loss": 1.1421875953674316, "train/negative_loss": 0.8174611926078796, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.324726402759552, "train/total_loss": 0.3845488429069519 }, { "epoch": 8.97887323943662, "grad_norm": 10.806668281555176, "learning_rate": 1.9655250176180408e-05, "loss": 0.6965, "step": 2550 }, { "epoch": 8.97887323943662, "step": 2550, "train/classification_loss": 0.22458066046237946, "train/contrastive_loss": 0.7480671405792236, "train/negative_loss": 0.40531519055366516, "train/num_negatives": 34, "train/num_positives": 12, "train/positive_loss": 0.34275197982788086, "train/total_loss": 0.37419408559799194 }, { "epoch": 8.97887323943662, "step": 2550, "train/classification_loss": 0.1722177416086197, "train/contrastive_loss": 0.6076792478561401, "train/negative_loss": 0.574845016002655, "train/num_negatives": 28, "train/num_positives": 22, "train/positive_loss": 0.03283420950174332, "train/total_loss": 0.29375359416007996 }, { "epoch": 9.154929577464788, "grad_norm": 9.524175643920898, "learning_rate": 1.964820295983087e-05, "loss": 0.6568, "step": 2600 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.24628448486328125, "train/contrastive_loss": 2.4654972553253174, "train/negative_loss": 1.4616281986236572, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0038690567016602, "train/total_loss": 0.7393839359283447 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.23898032307624817, "train/contrastive_loss": 0.7137899994850159, "train/negative_loss": 0.48506832122802734, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.22872166335582733, "train/total_loss": 0.3817383050918579 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.24360999464988708, "train/contrastive_loss": 2.752887487411499, "train/negative_loss": 1.7477415800094604, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.0051459074020386, "train/total_loss": 0.7941875457763672 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.14797106385231018, "train/contrastive_loss": 2.684443950653076, "train/negative_loss": 1.6355658769607544, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.0488781929016113, "train/total_loss": 0.6848598718643188 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19469140470027924, "train/contrastive_loss": 2.277411699295044, "train/negative_loss": 1.906540870666504, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.3708707392215729, "train/total_loss": 0.6501737236976624 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19751551747322083, "train/contrastive_loss": 2.7453670501708984, "train/negative_loss": 1.3876423835754395, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.3577245473861694, "train/total_loss": 0.746588945388794 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.2012830525636673, "train/contrastive_loss": 2.037076234817505, "train/negative_loss": 1.1387380361557007, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.8983381986618042, "train/total_loss": 0.608698308467865 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19069236516952515, "train/contrastive_loss": 0.9895957112312317, "train/negative_loss": 0.9894549250602722, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00014079608081374317, "train/total_loss": 0.38861149549484253 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.09525246173143387, "train/contrastive_loss": 0.8819663524627686, "train/negative_loss": 0.5683714151382446, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.31359490752220154, "train/total_loss": 0.271645724773407 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.17532993853092194, "train/contrastive_loss": 1.8370440006256104, "train/negative_loss": 1.2459131479263306, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5911308526992798, "train/total_loss": 0.5427387356758118 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1475764960050583, "train/contrastive_loss": 1.6424684524536133, "train/negative_loss": 0.6133848428726196, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.0290836095809937, "train/total_loss": 0.4760701656341553 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18745386600494385, "train/contrastive_loss": 1.9108036756515503, "train/negative_loss": 1.565867304801941, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.344936341047287, "train/total_loss": 0.5696146488189697 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19530166685581207, "train/contrastive_loss": 3.8807806968688965, "train/negative_loss": 2.0134706497192383, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.8673100471496582, "train/total_loss": 0.9714577794075012 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.16424857079982758, "train/contrastive_loss": 1.0744452476501465, "train/negative_loss": 0.5899219512939453, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.48452332615852356, "train/total_loss": 0.37913763523101807 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.14020979404449463, "train/contrastive_loss": 2.635652780532837, "train/negative_loss": 0.7812339663505554, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.8544187545776367, "train/total_loss": 0.6673403382301331 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1672203689813614, "train/contrastive_loss": 1.307839274406433, "train/negative_loss": 0.6420754194259644, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.6657638549804688, "train/total_loss": 0.4287882447242737 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.13216516375541687, "train/contrastive_loss": 1.2569119930267334, "train/negative_loss": 0.5905213356018066, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6663906574249268, "train/total_loss": 0.3835475742816925 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18154656887054443, "train/contrastive_loss": 0.45820435881614685, "train/negative_loss": 0.353636234998703, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.10456812381744385, "train/total_loss": 0.27318745851516724 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.15409497916698456, "train/contrastive_loss": 1.564359188079834, "train/negative_loss": 0.5728989839553833, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.9914602637290955, "train/total_loss": 0.46696680784225464 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.21266396343708038, "train/contrastive_loss": 2.9230458736419678, "train/negative_loss": 1.4068803787231445, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.5161654949188232, "train/total_loss": 0.7972731590270996 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.13373976945877075, "train/contrastive_loss": 1.6649099588394165, "train/negative_loss": 1.5701851844787598, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.09472475200891495, "train/total_loss": 0.466721773147583 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.13529695570468903, "train/contrastive_loss": 3.0700488090515137, "train/negative_loss": 1.8356618881225586, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.234386920928955, "train/total_loss": 0.7493067383766174 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.15869060158729553, "train/contrastive_loss": 2.246107339859009, "train/negative_loss": 0.882771372795105, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.3633359670639038, "train/total_loss": 0.6079120635986328 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.25418511033058167, "train/contrastive_loss": 3.2660160064697266, "train/negative_loss": 1.8137931823730469, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.4522228240966797, "train/total_loss": 0.9073883295059204 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18978899717330933, "train/contrastive_loss": 2.1697194576263428, "train/negative_loss": 0.8105581998825073, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.3591612577438354, "train/total_loss": 0.6237329244613647 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.20158325135707855, "train/contrastive_loss": 1.7320866584777832, "train/negative_loss": 1.474867820739746, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.2572188675403595, "train/total_loss": 0.5480005741119385 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19087320566177368, "train/contrastive_loss": 1.4457511901855469, "train/negative_loss": 1.4266146421432495, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.019136596471071243, "train/total_loss": 0.48002344369888306 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1796512007713318, "train/contrastive_loss": 0.326382040977478, "train/negative_loss": 0.26966819167137146, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.05671383813023567, "train/total_loss": 0.24492761492729187 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.24396435916423798, "train/contrastive_loss": 2.816596508026123, "train/negative_loss": 1.7620964050292969, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.0545001029968262, "train/total_loss": 0.8072836995124817 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.17636483907699585, "train/contrastive_loss": 0.4791860580444336, "train/negative_loss": 0.4780164659023285, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0011696013389155269, "train/total_loss": 0.2722020447254181 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18084284663200378, "train/contrastive_loss": 1.3591601848602295, "train/negative_loss": 1.2169331312179565, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.14222702383995056, "train/total_loss": 0.45267489552497864 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1617814600467682, "train/contrastive_loss": 3.6317224502563477, "train/negative_loss": 2.2193636894226074, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.4123586416244507, "train/total_loss": 0.888126015663147 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1851709932088852, "train/contrastive_loss": 1.976389765739441, "train/negative_loss": 1.21761953830719, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.758770227432251, "train/total_loss": 0.5804489254951477 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.20561179518699646, "train/contrastive_loss": 2.7897727489471436, "train/negative_loss": 1.7173573970794678, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 1.0724153518676758, "train/total_loss": 0.7635663747787476 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.22046226263046265, "train/contrastive_loss": 1.4839712381362915, "train/negative_loss": 0.8525365591049194, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.6314346790313721, "train/total_loss": 0.517256498336792 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1314994841814041, "train/contrastive_loss": 1.818369746208191, "train/negative_loss": 1.8179841041564941, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.0003856798866763711, "train/total_loss": 0.49517345428466797 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18952886760234833, "train/contrastive_loss": 1.2846763134002686, "train/negative_loss": 0.6666244268417358, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.6180518865585327, "train/total_loss": 0.4464641213417053 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.2132207304239273, "train/contrastive_loss": 2.0742974281311035, "train/negative_loss": 1.8339942693710327, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.24030321836471558, "train/total_loss": 0.6280802488327026 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1913914680480957, "train/contrastive_loss": 1.423677682876587, "train/negative_loss": 0.5711107850074768, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.8525668382644653, "train/total_loss": 0.4761269986629486 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.23982155323028564, "train/contrastive_loss": 3.3509202003479004, "train/negative_loss": 2.2825989723205566, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.0683211088180542, "train/total_loss": 0.9100056290626526 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.14049109816551208, "train/contrastive_loss": 1.6200203895568848, "train/negative_loss": 0.668586254119873, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.9514341354370117, "train/total_loss": 0.4644951820373535 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.20000284910202026, "train/contrastive_loss": 2.8137998580932617, "train/negative_loss": 1.6145503520965576, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.1992496252059937, "train/total_loss": 0.7627628445625305 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1838768720626831, "train/contrastive_loss": 0.7084023356437683, "train/negative_loss": 0.7078876495361328, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0005146655021235347, "train/total_loss": 0.3255573511123657 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.23325423896312714, "train/contrastive_loss": 1.3782320022583008, "train/negative_loss": 1.2698296308517456, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.10840240120887756, "train/total_loss": 0.5089006423950195 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1684018224477768, "train/contrastive_loss": 1.2575197219848633, "train/negative_loss": 0.8483104705810547, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.4092091917991638, "train/total_loss": 0.41990578174591064 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.32005971670150757, "train/contrastive_loss": 2.315727710723877, "train/negative_loss": 1.217613935470581, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.0981138944625854, "train/total_loss": 0.7832052707672119 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1508641541004181, "train/contrastive_loss": 1.903778076171875, "train/negative_loss": 1.145056128501892, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7587219476699829, "train/total_loss": 0.5316197872161865 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1702166199684143, "train/contrastive_loss": 2.458134174346924, "train/negative_loss": 2.1708731651306152, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.2872610092163086, "train/total_loss": 0.6618434190750122 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.2776569724082947, "train/contrastive_loss": 2.454988956451416, "train/negative_loss": 2.454987049102783, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.9073504518019035e-06, "train/total_loss": 0.7686547636985779 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19200481474399567, "train/contrastive_loss": 3.16558837890625, "train/negative_loss": 1.7555313110351562, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.4100570678710938, "train/total_loss": 0.8251224756240845 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.17200742661952972, "train/contrastive_loss": 0.1734849363565445, "train/negative_loss": 0.11128728836774826, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.062197647988796234, "train/total_loss": 0.20670440793037415 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18401043117046356, "train/contrastive_loss": 0.8526637554168701, "train/negative_loss": 0.8036697506904602, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.0489940345287323, "train/total_loss": 0.35454317927360535 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.20552721619606018, "train/contrastive_loss": 1.5434834957122803, "train/negative_loss": 1.0935592651367188, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.4499242901802063, "train/total_loss": 0.5142239332199097 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.29712027311325073, "train/contrastive_loss": 2.836956262588501, "train/negative_loss": 1.22115159034729, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.615804672241211, "train/total_loss": 0.8645115494728088 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.15018239617347717, "train/contrastive_loss": 0.6867485046386719, "train/negative_loss": 0.39466720819473267, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2920812666416168, "train/total_loss": 0.28753209114074707 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.13760094344615936, "train/contrastive_loss": 1.0253562927246094, "train/negative_loss": 0.35280925035476685, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.6725470423698425, "train/total_loss": 0.342672199010849 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.15657001733779907, "train/contrastive_loss": 1.6581045389175415, "train/negative_loss": 0.7265006899833679, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.9316038489341736, "train/total_loss": 0.4881909191608429 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.18820948898792267, "train/contrastive_loss": 1.6809914112091064, "train/negative_loss": 1.2318156957626343, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.44917571544647217, "train/total_loss": 0.5244078040122986 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.19504046440124512, "train/contrastive_loss": 1.5233054161071777, "train/negative_loss": 0.8468884825706482, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.6764168739318848, "train/total_loss": 0.4997015595436096 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.11603426188230515, "train/contrastive_loss": 0.686326265335083, "train/negative_loss": 0.6851330995559692, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0011931576300412416, "train/total_loss": 0.2532995045185089 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.17929503321647644, "train/contrastive_loss": 2.505115509033203, "train/negative_loss": 1.4139941930770874, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.0911211967468262, "train/total_loss": 0.6803181171417236 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.2623046338558197, "train/contrastive_loss": 2.517824172973633, "train/negative_loss": 1.8878295421600342, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.6299946904182434, "train/total_loss": 0.7658694982528687 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.14070263504981995, "train/contrastive_loss": 2.1426305770874023, "train/negative_loss": 1.158164381980896, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.9844663143157959, "train/total_loss": 0.5692287683486938 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.20783792436122894, "train/contrastive_loss": 1.9898386001586914, "train/negative_loss": 1.4247000217437744, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.565138578414917, "train/total_loss": 0.6058056354522705 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.17116650938987732, "train/contrastive_loss": 2.381537914276123, "train/negative_loss": 0.7003723382949829, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.6811656951904297, "train/total_loss": 0.6474741101264954 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1755324751138687, "train/contrastive_loss": 4.940838813781738, "train/negative_loss": 4.9408369064331055, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.7762209836291731e-06, "train/total_loss": 1.1637002229690552 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.1799212545156479, "train/contrastive_loss": 2.2084808349609375, "train/negative_loss": 0.6446971297264099, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.5637837648391724, "train/total_loss": 0.6216174364089966 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.212065190076828, "train/contrastive_loss": 2.409909725189209, "train/negative_loss": 1.4343678951263428, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9755419492721558, "train/total_loss": 0.6940471529960632 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.16545768082141876, "train/contrastive_loss": 2.4944605827331543, "train/negative_loss": 1.2136564254760742, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.28080415725708, "train/total_loss": 0.6643497943878174 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.25046831369400024, "train/contrastive_loss": 2.2382519245147705, "train/negative_loss": 2.17216157913208, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.06609038263559341, "train/total_loss": 0.6981186866760254 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.17515461146831512, "train/contrastive_loss": 2.257793426513672, "train/negative_loss": 1.4612540006637573, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.7965394854545593, "train/total_loss": 0.6267132759094238 }, { "epoch": 9.154929577464788, "eval_exact_match_accuracy": 0.2857142857142857, "eval_hamming_loss": 0.06774561676522461, "eval_loss": 0.5803765058517456, "eval_macro_f1": 0.36105497113614543, "eval_macro_precision": 0.5920739147438296, "eval_macro_recall": 0.2825809175403302, "eval_micro_f1": 0.5291997116077866, "eval_micro_precision": 0.8173719376391982, "eval_micro_recall": 0.39125799573560766, "eval_runtime": 2.8565, "eval_samples_per_second": 198.492, "eval_steps_per_second": 24.855, "step": 2600 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.16526037454605103, "train/contrastive_loss": 0.768109917640686, "train/negative_loss": 0.6881194710731506, "train/num_negatives": 44, "train/num_positives": 10, "train/positive_loss": 0.0799904614686966, "train/total_loss": 0.3188823461532593 }, { "epoch": 9.154929577464788, "step": 2600, "train/classification_loss": 0.14416836202144623, "train/contrastive_loss": 1.0418167114257812, "train/negative_loss": 0.7043741941452026, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.33744245767593384, "train/total_loss": 0.35253170132637024 }, { "epoch": 9.330985915492958, "grad_norm": 9.925588607788086, "learning_rate": 1.9641155743481327e-05, "loss": 0.6413, "step": 2650 }, { "epoch": 9.330985915492958, "step": 2650, "train/classification_loss": 0.1666610985994339, "train/contrastive_loss": 0.6737055778503418, "train/negative_loss": 0.40825411677360535, "train/num_negatives": 38, "train/num_positives": 18, "train/positive_loss": 0.26545149087905884, "train/total_loss": 0.30140221118927 }, { "epoch": 9.330985915492958, "step": 2650, "train/classification_loss": 0.12780001759529114, "train/contrastive_loss": 0.5189247727394104, "train/negative_loss": 0.5179834365844727, "train/num_negatives": 36, "train/num_positives": 20, "train/positive_loss": 0.0009413353982381523, "train/total_loss": 0.23158496618270874 }, { "epoch": 9.507042253521126, "grad_norm": 8.174408912658691, "learning_rate": 1.9634108527131786e-05, "loss": 0.683, "step": 2700 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.24618496000766754, "train/contrastive_loss": 2.3181824684143066, "train/negative_loss": 1.2733820676803589, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0448005199432373, "train/total_loss": 0.7098214626312256 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.24503618478775024, "train/contrastive_loss": 0.7689821720123291, "train/negative_loss": 0.7245208024978638, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.04446136951446533, "train/total_loss": 0.39883261919021606 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.23767878115177155, "train/contrastive_loss": 2.9527482986450195, "train/negative_loss": 1.5046037435531616, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.4481446743011475, "train/total_loss": 0.8282284140586853 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1498671919107437, "train/contrastive_loss": 1.6355702877044678, "train/negative_loss": 1.4459677934646606, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.18960247933864594, "train/total_loss": 0.4769812822341919 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19280041754245758, "train/contrastive_loss": 2.824444055557251, "train/negative_loss": 2.696667432785034, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.1277766227722168, "train/total_loss": 0.7576892375946045 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.2015714794397354, "train/contrastive_loss": 2.269200325012207, "train/negative_loss": 1.5796488523483276, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.6895513534545898, "train/total_loss": 0.6554115414619446 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1885913759469986, "train/contrastive_loss": 1.3630460500717163, "train/negative_loss": 0.7901840209960938, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.5728620290756226, "train/total_loss": 0.4612005949020386 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.18265803158283234, "train/contrastive_loss": 1.1519484519958496, "train/negative_loss": 1.1519181728363037, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 3.027961793122813e-05, "train/total_loss": 0.413047730922699 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.11412450671195984, "train/contrastive_loss": 0.6452596783638, "train/negative_loss": 0.45017990469932556, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.19507978856563568, "train/total_loss": 0.2431764453649521 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.20929855108261108, "train/contrastive_loss": 2.9067678451538086, "train/negative_loss": 2.310359239578247, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5964085459709167, "train/total_loss": 0.7906521558761597 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.13452234864234924, "train/contrastive_loss": 0.902179479598999, "train/negative_loss": 0.753136396408081, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.14904308319091797, "train/total_loss": 0.31495824456214905 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.17940469086170197, "train/contrastive_loss": 3.0230913162231445, "train/negative_loss": 1.974744200706482, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.0483472347259521, "train/total_loss": 0.7840229272842407 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.21684207022190094, "train/contrastive_loss": 4.046243667602539, "train/negative_loss": 2.533534288406372, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.512709617614746, "train/total_loss": 1.0260908603668213 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.15810632705688477, "train/contrastive_loss": 1.295092225074768, "train/negative_loss": 0.8452231287956238, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.4498691260814667, "train/total_loss": 0.41712477803230286 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.13270686566829681, "train/contrastive_loss": 2.3346595764160156, "train/negative_loss": 0.6693814396858215, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.6652781963348389, "train/total_loss": 0.5996387600898743 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.15910740196704865, "train/contrastive_loss": 0.9473980665206909, "train/negative_loss": 0.5109848976135254, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.4364131689071655, "train/total_loss": 0.3485870361328125 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.10971515625715256, "train/contrastive_loss": 1.065409541130066, "train/negative_loss": 0.6277315616607666, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4376779794692993, "train/total_loss": 0.3227970600128174 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.22380180656909943, "train/contrastive_loss": 2.012408494949341, "train/negative_loss": 0.6866670250892639, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.3257414102554321, "train/total_loss": 0.6262835264205933 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.14739564061164856, "train/contrastive_loss": 0.718749463558197, "train/negative_loss": 0.6504449248313904, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.06830452382564545, "train/total_loss": 0.29114553332328796 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.20180334150791168, "train/contrastive_loss": 3.0506796836853027, "train/negative_loss": 1.5672178268432617, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.4834619760513306, "train/total_loss": 0.8119392991065979 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.13206076622009277, "train/contrastive_loss": 2.2139627933502197, "train/negative_loss": 2.194715738296509, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.019246986135840416, "train/total_loss": 0.5748533010482788 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.13065706193447113, "train/contrastive_loss": 2.7108256816864014, "train/negative_loss": 2.2679407596588135, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4428848624229431, "train/total_loss": 0.6728222370147705 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.16608917713165283, "train/contrastive_loss": 2.4329495429992676, "train/negative_loss": 1.4563369750976562, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.9766125679016113, "train/total_loss": 0.6526790857315063 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.2685789167881012, "train/contrastive_loss": 4.244009017944336, "train/negative_loss": 2.465100049972534, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.7789090871810913, "train/total_loss": 1.1173807382583618 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.17535828053951263, "train/contrastive_loss": 1.419189691543579, "train/negative_loss": 1.1602553129196167, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.2589344084262848, "train/total_loss": 0.45919620990753174 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.21858078241348267, "train/contrastive_loss": 3.189957618713379, "train/negative_loss": 2.247539520263672, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9424179792404175, "train/total_loss": 0.8565723299980164 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19780108332633972, "train/contrastive_loss": 2.1977226734161377, "train/negative_loss": 2.1974360942840576, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.000286687194602564, "train/total_loss": 0.6373456120491028 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.18451203405857086, "train/contrastive_loss": 0.856658935546875, "train/negative_loss": 0.8316022753715515, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.025056643411517143, "train/total_loss": 0.35584384202957153 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.2588823437690735, "train/contrastive_loss": 2.892712116241455, "train/negative_loss": 1.6340378522872925, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.258674144744873, "train/total_loss": 0.8374247550964355 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1945541948080063, "train/contrastive_loss": 0.9771105647087097, "train/negative_loss": 0.9692712426185608, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.007839331403374672, "train/total_loss": 0.3899763226509094 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1904030442237854, "train/contrastive_loss": 1.8278334140777588, "train/negative_loss": 1.5663201808929443, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.2615131735801697, "train/total_loss": 0.5559697151184082 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1648002415895462, "train/contrastive_loss": 2.4086363315582275, "train/negative_loss": 2.3721089363098145, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.03652748838067055, "train/total_loss": 0.6465275287628174 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.184440016746521, "train/contrastive_loss": 2.1555018424987793, "train/negative_loss": 1.4502166509628296, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7052853107452393, "train/total_loss": 0.6155403852462769 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.21587824821472168, "train/contrastive_loss": 2.5807929039001465, "train/negative_loss": 1.667168378829956, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.9136244654655457, "train/total_loss": 0.732036828994751 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.24265708029270172, "train/contrastive_loss": 1.4171247482299805, "train/negative_loss": 0.9620932340621948, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.45503151416778564, "train/total_loss": 0.5260820388793945 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.14479337632656097, "train/contrastive_loss": 2.200500249862671, "train/negative_loss": 2.2004213333129883, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 7.887629908509552e-05, "train/total_loss": 0.5848934054374695 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1943824738264084, "train/contrastive_loss": 1.702411413192749, "train/negative_loss": 0.810370147228241, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.8920413255691528, "train/total_loss": 0.5348647832870483 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.21114720404148102, "train/contrastive_loss": 1.6703277826309204, "train/negative_loss": 1.5292900800704956, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.14103767275810242, "train/total_loss": 0.5452127456665039 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19728179275989532, "train/contrastive_loss": 0.6125668883323669, "train/negative_loss": 0.46839651465415955, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.1441703587770462, "train/total_loss": 0.319795161485672 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.29019972681999207, "train/contrastive_loss": 4.630445957183838, "train/negative_loss": 1.6993427276611328, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.931103229522705, "train/total_loss": 1.2162889242172241 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1425984799861908, "train/contrastive_loss": 1.1256687641143799, "train/negative_loss": 0.8306665420532227, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.29500219225883484, "train/total_loss": 0.3677322268486023 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19690319895744324, "train/contrastive_loss": 2.0265026092529297, "train/negative_loss": 1.3792775869369507, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.647225022315979, "train/total_loss": 0.6022037267684937 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.16565266251564026, "train/contrastive_loss": 0.9898386597633362, "train/negative_loss": 0.989719808101654, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00011883485422004014, "train/total_loss": 0.363620400428772 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.275462806224823, "train/contrastive_loss": 1.6302192211151123, "train/negative_loss": 0.9540430307388306, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.6761762499809265, "train/total_loss": 0.6015066504478455 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.16976973414421082, "train/contrastive_loss": 2.2232112884521484, "train/negative_loss": 2.210834264755249, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.01237698458135128, "train/total_loss": 0.6144120097160339 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.32502618432044983, "train/contrastive_loss": 2.4733924865722656, "train/negative_loss": 1.3015379905700684, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.1718544960021973, "train/total_loss": 0.8197046518325806 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.17891135811805725, "train/contrastive_loss": 3.392833948135376, "train/negative_loss": 1.1546037197113037, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.2382302284240723, "train/total_loss": 0.857478141784668 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.18559923768043518, "train/contrastive_loss": 3.554265022277832, "train/negative_loss": 2.835493326187134, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7187715768814087, "train/total_loss": 0.8964523077011108 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.25483810901641846, "train/contrastive_loss": 2.615293502807617, "train/negative_loss": 2.6152801513671875, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.3232318451628089e-05, "train/total_loss": 0.7778968214988708 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19435539841651917, "train/contrastive_loss": 2.512592077255249, "train/negative_loss": 0.9203905463218689, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.5922014713287354, "train/total_loss": 0.6968737840652466 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1328953057527542, "train/contrastive_loss": 0.22658661007881165, "train/negative_loss": 0.11732051521539688, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.10926608741283417, "train/total_loss": 0.17821262776851654 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19937169551849365, "train/contrastive_loss": 1.1343051195144653, "train/negative_loss": 1.110209345817566, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.024095721542835236, "train/total_loss": 0.4262327253818512 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.18528319895267487, "train/contrastive_loss": 1.4506970643997192, "train/negative_loss": 1.4143707752227783, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.036326318979263306, "train/total_loss": 0.47542262077331543 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.3076325058937073, "train/contrastive_loss": 3.3048787117004395, "train/negative_loss": 1.1579900979995728, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 2.146888494491577, "train/total_loss": 0.9686082601547241 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.13595907390117645, "train/contrastive_loss": 0.7254592180252075, "train/negative_loss": 0.5122767090797424, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.2131824940443039, "train/total_loss": 0.2810509204864502 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.11226639896631241, "train/contrastive_loss": 0.4652174413204193, "train/negative_loss": 0.4139293432235718, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.05128810182213783, "train/total_loss": 0.2053098976612091 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1604146659374237, "train/contrastive_loss": 2.3324451446533203, "train/negative_loss": 1.2000235319137573, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.1324217319488525, "train/total_loss": 0.6269037127494812 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.2118668407201767, "train/contrastive_loss": 3.014366626739502, "train/negative_loss": 1.657504916191101, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.3568618297576904, "train/total_loss": 0.8147401809692383 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.18209993839263916, "train/contrastive_loss": 0.9660111665725708, "train/negative_loss": 0.7024995684623718, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.26351162791252136, "train/total_loss": 0.37530219554901123 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.11673104017972946, "train/contrastive_loss": 0.6742532253265381, "train/negative_loss": 0.40294432640075684, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.27130889892578125, "train/total_loss": 0.25158169865608215 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.19410599768161774, "train/contrastive_loss": 2.5448427200317383, "train/negative_loss": 1.4728997945785522, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.0719430446624756, "train/total_loss": 0.7030745148658752 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.255287766456604, "train/contrastive_loss": 1.4933267831802368, "train/negative_loss": 1.1634098291397095, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.32991698384284973, "train/total_loss": 0.5539531707763672 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.13877858221530914, "train/contrastive_loss": 1.856605887413025, "train/negative_loss": 1.4671188592910767, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.38948702812194824, "train/total_loss": 0.5100997686386108 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1751866638660431, "train/contrastive_loss": 0.5172592401504517, "train/negative_loss": 0.45144206285476685, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0658172070980072, "train/total_loss": 0.2786385118961334 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.16447676718235016, "train/contrastive_loss": 1.8310130834579468, "train/negative_loss": 0.4243212640285492, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.4066917896270752, "train/total_loss": 0.5306794047355652 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.16225150227546692, "train/contrastive_loss": 4.991938591003418, "train/negative_loss": 4.991936683654785, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.9431149667070713e-06, "train/total_loss": 1.1606392860412598 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1687004566192627, "train/contrastive_loss": 1.6625807285308838, "train/negative_loss": 0.4287572503089905, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.233823537826538, "train/total_loss": 0.5012166500091553 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.21064788103103638, "train/contrastive_loss": 2.6139304637908936, "train/negative_loss": 2.035810947418213, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5781194567680359, "train/total_loss": 0.7334339618682861 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.1537582129240036, "train/contrastive_loss": 1.8837095499038696, "train/negative_loss": 0.9978513121604919, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8858582377433777, "train/total_loss": 0.5305001139640808 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.2564479112625122, "train/contrastive_loss": 1.8451323509216309, "train/negative_loss": 1.3986173868179321, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.44651490449905396, "train/total_loss": 0.6254743933677673 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.18230153620243073, "train/contrastive_loss": 1.692655324935913, "train/negative_loss": 1.628920078277588, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.06373518705368042, "train/total_loss": 0.5208325982093811 }, { "epoch": 9.507042253521126, "eval_exact_match_accuracy": 0.2786596119929453, "eval_hamming_loss": 0.07127295362589481, "eval_loss": 0.5910915732383728, "eval_macro_f1": 0.3399007092993409, "eval_macro_precision": 0.560983161895091, "eval_macro_recall": 0.26820156138559786, "eval_micro_f1": 0.5178947368421053, "eval_micro_precision": 0.757700205338809, "eval_micro_recall": 0.39339019189765456, "eval_runtime": 2.8413, "eval_samples_per_second": 199.56, "eval_steps_per_second": 24.989, "step": 2700 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.12901562452316284, "train/contrastive_loss": 0.8175753951072693, "train/negative_loss": 0.8139306902885437, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.003644683165475726, "train/total_loss": 0.29253071546554565 }, { "epoch": 9.507042253521126, "step": 2700, "train/classification_loss": 0.15829998254776, "train/contrastive_loss": 1.8234858512878418, "train/negative_loss": 1.3036770820617676, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.5198087096214294, "train/total_loss": 0.5229971408843994 }, { "epoch": 9.683098591549296, "grad_norm": 9.153973579406738, "learning_rate": 1.9627061310782244e-05, "loss": 0.6411, "step": 2750 }, { "epoch": 9.683098591549296, "step": 2750, "train/classification_loss": 0.11858583986759186, "train/contrastive_loss": 0.4542088508605957, "train/negative_loss": 0.40345609188079834, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.050752751529216766, "train/total_loss": 0.209427610039711 }, { "epoch": 9.683098591549296, "step": 2750, "train/classification_loss": 0.08259477466344833, "train/contrastive_loss": 0.3632351756095886, "train/negative_loss": 0.35160335898399353, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.011631814762949944, "train/total_loss": 0.15524181723594666 }, { "epoch": 9.859154929577464, "grad_norm": 10.849760055541992, "learning_rate": 1.96200140944327e-05, "loss": 0.6916, "step": 2800 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2422458976507187, "train/contrastive_loss": 1.721174716949463, "train/negative_loss": 1.2936679124832153, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.4275067448616028, "train/total_loss": 0.5864808559417725 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2578805983066559, "train/contrastive_loss": 0.9033896923065186, "train/negative_loss": 0.4029536247253418, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5004360675811768, "train/total_loss": 0.43855851888656616 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2397628128528595, "train/contrastive_loss": 2.841975450515747, "train/negative_loss": 1.3694028854370117, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.4725725650787354, "train/total_loss": 0.8081579208374023 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.14542058110237122, "train/contrastive_loss": 2.0952982902526855, "train/negative_loss": 1.056650161743164, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.038648247718811, "train/total_loss": 0.5644802451133728 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1968403160572052, "train/contrastive_loss": 2.0891003608703613, "train/negative_loss": 1.5229990482330322, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.5661011934280396, "train/total_loss": 0.614660382270813 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19998688995838165, "train/contrastive_loss": 2.3039064407348633, "train/negative_loss": 1.2318562269210815, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.0720502138137817, "train/total_loss": 0.6607682108879089 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.17715367674827576, "train/contrastive_loss": 1.472278356552124, "train/negative_loss": 0.7979770302772522, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.674301266670227, "train/total_loss": 0.47160935401916504 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.18147341907024384, "train/contrastive_loss": 0.7004166841506958, "train/negative_loss": 0.6988470554351807, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0015696082264184952, "train/total_loss": 0.3215567469596863 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.10392995178699493, "train/contrastive_loss": 0.953577995300293, "train/negative_loss": 0.30992963910102844, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.6436483860015869, "train/total_loss": 0.2946455478668213 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.18369993567466736, "train/contrastive_loss": 2.3295676708221436, "train/negative_loss": 1.3953849077224731, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.9341827630996704, "train/total_loss": 0.6496134996414185 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1467398703098297, "train/contrastive_loss": 1.3287410736083984, "train/negative_loss": 0.6292564868927002, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.6994845271110535, "train/total_loss": 0.41248810291290283 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.16137251257896423, "train/contrastive_loss": 1.925856113433838, "train/negative_loss": 1.0077437162399292, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.9181124567985535, "train/total_loss": 0.5465437173843384 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.20013026893138885, "train/contrastive_loss": 3.637685775756836, "train/negative_loss": 1.4786475896835327, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.1590380668640137, "train/total_loss": 0.9276674389839172 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.16525375843048096, "train/contrastive_loss": 1.4299119710922241, "train/negative_loss": 0.6464141607284546, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.7834978103637695, "train/total_loss": 0.45123615860939026 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.14059491455554962, "train/contrastive_loss": 3.1143014430999756, "train/negative_loss": 0.7113563418388367, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.402945041656494, "train/total_loss": 0.7634552121162415 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.15830004215240479, "train/contrastive_loss": 1.034705400466919, "train/negative_loss": 0.2746495008468628, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.7600558996200562, "train/total_loss": 0.3652411103248596 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.12019146233797073, "train/contrastive_loss": 1.1123141050338745, "train/negative_loss": 0.4054318368434906, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7068822383880615, "train/total_loss": 0.342654287815094 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19889847934246063, "train/contrastive_loss": 1.3846909999847412, "train/negative_loss": 0.5369450449943542, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.8477458953857422, "train/total_loss": 0.47583669424057007 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.14434264600276947, "train/contrastive_loss": 0.9681116342544556, "train/negative_loss": 0.36274853348731995, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.6053630709648132, "train/total_loss": 0.3379649817943573 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.21232929825782776, "train/contrastive_loss": 3.307300090789795, "train/negative_loss": 1.3321508169174194, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.975149393081665, "train/total_loss": 0.8737893104553223 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1258581280708313, "train/contrastive_loss": 1.1267513036727905, "train/negative_loss": 1.114208459854126, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.0125428456813097, "train/total_loss": 0.3512083888053894 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.13371552526950836, "train/contrastive_loss": 2.8056769371032715, "train/negative_loss": 1.911933422088623, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.893743634223938, "train/total_loss": 0.6948509216308594 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.13864447176456451, "train/contrastive_loss": 1.1586953401565552, "train/negative_loss": 0.8028740286827087, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.3558213412761688, "train/total_loss": 0.3703835606575012 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2527272403240204, "train/contrastive_loss": 3.6967899799346924, "train/negative_loss": 1.8888001441955566, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.8079898357391357, "train/total_loss": 0.9920852184295654 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.16538181900978088, "train/contrastive_loss": 2.630919933319092, "train/negative_loss": 0.9302123188972473, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.7007076740264893, "train/total_loss": 0.6915658712387085 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.23373982310295105, "train/contrastive_loss": 2.723788261413574, "train/negative_loss": 1.5791181325912476, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.144670009613037, "train/total_loss": 0.7784974575042725 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19584132730960846, "train/contrastive_loss": 2.3939971923828125, "train/negative_loss": 2.336350679397583, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.05764659866690636, "train/total_loss": 0.6746407747268677 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1803833544254303, "train/contrastive_loss": 0.295193076133728, "train/negative_loss": 0.2837584912776947, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.011434579268097878, "train/total_loss": 0.23942196369171143 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2578928470611572, "train/contrastive_loss": 2.998237371444702, "train/negative_loss": 1.3674235343933105, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.6308138370513916, "train/total_loss": 0.8575403094291687 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.17316599190235138, "train/contrastive_loss": 0.3680519461631775, "train/negative_loss": 0.3675346076488495, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0005173303070478141, "train/total_loss": 0.24677637219429016 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.16192907094955444, "train/contrastive_loss": 1.2288349866867065, "train/negative_loss": 0.8368066549301147, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.3920283615589142, "train/total_loss": 0.40769606828689575 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1536184400320053, "train/contrastive_loss": 1.9579675197601318, "train/negative_loss": 1.2453473806381226, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.7126200795173645, "train/total_loss": 0.5452119708061218 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.17546148598194122, "train/contrastive_loss": 1.2615089416503906, "train/negative_loss": 0.624224841594696, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.6372841596603394, "train/total_loss": 0.42776328325271606 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2133786827325821, "train/contrastive_loss": 2.3824925422668457, "train/negative_loss": 1.7685984373092651, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.6138941049575806, "train/total_loss": 0.6898772120475769 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2253674566745758, "train/contrastive_loss": 1.4370590448379517, "train/negative_loss": 0.9245150685310364, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5125439763069153, "train/total_loss": 0.5127792358398438 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.13447359204292297, "train/contrastive_loss": 1.8005852699279785, "train/negative_loss": 1.800480604171753, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.00010467678657732904, "train/total_loss": 0.4945906400680542 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19570650160312653, "train/contrastive_loss": 1.7497758865356445, "train/negative_loss": 0.5966654419898987, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 1.153110384941101, "train/total_loss": 0.5456616878509521 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2233089953660965, "train/contrastive_loss": 2.3549704551696777, "train/negative_loss": 2.2732763290405273, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0816941112279892, "train/total_loss": 0.6943030953407288 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2193119078874588, "train/contrastive_loss": 1.410846471786499, "train/negative_loss": 0.5325482487678528, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.8782982230186462, "train/total_loss": 0.5014812350273132 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2568223774433136, "train/contrastive_loss": 4.215339660644531, "train/negative_loss": 1.7484999895095825, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.4668397903442383, "train/total_loss": 1.0998903512954712 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.14489434659481049, "train/contrastive_loss": 1.600229024887085, "train/negative_loss": 0.7183215022087097, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.8819074630737305, "train/total_loss": 0.4649401307106018 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19604523479938507, "train/contrastive_loss": 3.19573974609375, "train/negative_loss": 1.3959224224090576, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.7998173236846924, "train/total_loss": 0.8351931571960449 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.15760312974452972, "train/contrastive_loss": 0.4566722810268402, "train/negative_loss": 0.45651084184646606, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00016143334505613893, "train/total_loss": 0.24893757700920105 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.23440247774124146, "train/contrastive_loss": 0.9202690124511719, "train/negative_loss": 0.6256960034370422, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.29457297921180725, "train/total_loss": 0.4184562861919403 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.18507640063762665, "train/contrastive_loss": 2.756464719772339, "train/negative_loss": 2.0327699184417725, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.7236948013305664, "train/total_loss": 0.7363693714141846 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.3184349834918976, "train/contrastive_loss": 1.9404232501983643, "train/negative_loss": 0.8505808115005493, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.089842438697815, "train/total_loss": 0.706519603729248 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.15520323812961578, "train/contrastive_loss": 2.6822690963745117, "train/negative_loss": 0.999466061592102, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.6828030347824097, "train/total_loss": 0.6916570663452148 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.18790845572948456, "train/contrastive_loss": 2.603407859802246, "train/negative_loss": 2.186038017272949, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4173697233200073, "train/total_loss": 0.708590030670166 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.26583942770957947, "train/contrastive_loss": 2.217435121536255, "train/negative_loss": 2.2174315452575684, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 3.57628505298635e-06, "train/total_loss": 0.709326446056366 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.2037402093410492, "train/contrastive_loss": 2.2504491806030273, "train/negative_loss": 1.1650561094284058, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.0853931903839111, "train/total_loss": 0.6538300514221191 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1263217329978943, "train/contrastive_loss": 0.14254340529441833, "train/negative_loss": 0.08723662793636322, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.05530676990747452, "train/total_loss": 0.15483041107654572 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19413205981254578, "train/contrastive_loss": 0.9580098986625671, "train/negative_loss": 0.7995215058326721, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.15848837792873383, "train/total_loss": 0.38573402166366577 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1995437741279602, "train/contrastive_loss": 1.3031272888183594, "train/negative_loss": 1.10425865650177, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.19886858761310577, "train/total_loss": 0.4601692259311676 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.3115212023258209, "train/contrastive_loss": 2.1659932136535645, "train/negative_loss": 1.0569956302642822, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.1089975833892822, "train/total_loss": 0.7447198629379272 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.13202039897441864, "train/contrastive_loss": 0.6856703758239746, "train/negative_loss": 0.4037132263183594, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.28195711970329285, "train/total_loss": 0.26915448904037476 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.13055665791034698, "train/contrastive_loss": 0.8618555665016174, "train/negative_loss": 0.422348290681839, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.43950727581977844, "train/total_loss": 0.30292779207229614 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.15074796974658966, "train/contrastive_loss": 1.8078230619430542, "train/negative_loss": 0.6606121063232422, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.147210955619812, "train/total_loss": 0.5123125910758972 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.189544677734375, "train/contrastive_loss": 2.6949150562286377, "train/negative_loss": 1.2093682289123535, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.4855468273162842, "train/total_loss": 0.7285277247428894 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1958393156528473, "train/contrastive_loss": 1.5279107093811035, "train/negative_loss": 0.6890113353729248, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.8388993144035339, "train/total_loss": 0.5014214515686035 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.09453032165765762, "train/contrastive_loss": 0.47734537720680237, "train/negative_loss": 0.1615724265575409, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.3157729506492615, "train/total_loss": 0.18999940156936646 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19003990292549133, "train/contrastive_loss": 2.1613221168518066, "train/negative_loss": 1.2775293588638306, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.8837928771972656, "train/total_loss": 0.6223043203353882 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.250262051820755, "train/contrastive_loss": 1.6377253532409668, "train/negative_loss": 0.8702628016471863, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.7674626111984253, "train/total_loss": 0.5778071284294128 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.14335666596889496, "train/contrastive_loss": 1.5191998481750488, "train/negative_loss": 0.9416450262069702, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.5775548219680786, "train/total_loss": 0.4471966624259949 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.20338916778564453, "train/contrastive_loss": 0.7640072703361511, "train/negative_loss": 0.5475155711174011, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.2164916843175888, "train/total_loss": 0.35619062185287476 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.17595137655735016, "train/contrastive_loss": 2.362671375274658, "train/negative_loss": 0.6120171546936035, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.7506542205810547, "train/total_loss": 0.6484856605529785 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.16194500029087067, "train/contrastive_loss": 4.332770347595215, "train/negative_loss": 4.33276891708374, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.466275875827705e-06, "train/total_loss": 1.0284991264343262 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.17135140299797058, "train/contrastive_loss": 1.140178918838501, "train/negative_loss": 0.3936411142349243, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.7465378642082214, "train/total_loss": 0.3993871808052063 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19975849986076355, "train/contrastive_loss": 2.2232303619384766, "train/negative_loss": 1.2000625133514404, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0231679677963257, "train/total_loss": 0.6444045901298523 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.1608150750398636, "train/contrastive_loss": 2.643754482269287, "train/negative_loss": 0.8494847416877747, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.7942698001861572, "train/total_loss": 0.6895659565925598 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.24466247856616974, "train/contrastive_loss": 1.6202069520950317, "train/negative_loss": 0.9127046465873718, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.7075023055076599, "train/total_loss": 0.5687038898468018 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.16331139206886292, "train/contrastive_loss": 0.4944665729999542, "train/negative_loss": 0.41176989674568176, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.08269666880369186, "train/total_loss": 0.26220470666885376 }, { "epoch": 9.859154929577464, "eval_exact_match_accuracy": 0.2892416225749559, "eval_hamming_loss": 0.06795310716879345, "eval_loss": 0.5553329586982727, "eval_macro_f1": 0.3898906591099431, "eval_macro_precision": 0.6353736023298848, "eval_macro_recall": 0.3207501530327882, "eval_micro_f1": 0.5416375087473758, "eval_micro_precision": 0.7881873727087576, "eval_micro_recall": 0.4125799573560768, "eval_runtime": 2.8425, "eval_samples_per_second": 199.47, "eval_steps_per_second": 24.978, "step": 2800 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.19349829852581024, "train/contrastive_loss": 1.3443948030471802, "train/negative_loss": 0.7074541449546814, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.6369406580924988, "train/total_loss": 0.46237725019454956 }, { "epoch": 9.859154929577464, "step": 2800, "train/classification_loss": 0.14223407208919525, "train/contrastive_loss": 0.6640971899032593, "train/negative_loss": 0.6640753746032715, "train/num_negatives": 52, "train/num_positives": 2, "train/positive_loss": 2.1815538275404833e-05, "train/total_loss": 0.2750535011291504 }, { "epoch": 10.035211267605634, "grad_norm": 7.347024440765381, "learning_rate": 1.961296687808316e-05, "loss": 0.6289, "step": 2850 }, { "epoch": 10.035211267605634, "step": 2850, "train/classification_loss": 0.16506929695606232, "train/contrastive_loss": 0.8735600113868713, "train/negative_loss": 0.27111417055130005, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.6024458408355713, "train/total_loss": 0.3397812843322754 }, { "epoch": 10.035211267605634, "step": 2850, "train/classification_loss": 0.16181811690330505, "train/contrastive_loss": 0.7897449731826782, "train/negative_loss": 0.5512301325798035, "train/num_negatives": 24, "train/num_positives": 24, "train/positive_loss": 0.23851487040519714, "train/total_loss": 0.3197671175003052 }, { "epoch": 10.211267605633802, "grad_norm": 6.384469985961914, "learning_rate": 1.9605919661733618e-05, "loss": 0.6112, "step": 2900 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.2628132700920105, "train/contrastive_loss": 1.5475016832351685, "train/negative_loss": 1.4081183671951294, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.13938328623771667, "train/total_loss": 0.5723136067390442 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.23209384083747864, "train/contrastive_loss": 1.1163294315338135, "train/negative_loss": 0.36060935258865356, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.7557200193405151, "train/total_loss": 0.45535972714424133 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.21153056621551514, "train/contrastive_loss": 3.230170249938965, "train/negative_loss": 2.0683212280273438, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.161849021911621, "train/total_loss": 0.8575646281242371 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.15908098220825195, "train/contrastive_loss": 2.679654598236084, "train/negative_loss": 1.5057131052017212, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.1739414930343628, "train/total_loss": 0.6950119137763977 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.17802831530570984, "train/contrastive_loss": 2.07833194732666, "train/negative_loss": 1.31305992603302, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.7652720212936401, "train/total_loss": 0.5936946868896484 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.20847803354263306, "train/contrastive_loss": 2.733017683029175, "train/negative_loss": 1.0552629232406616, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.6777547597885132, "train/total_loss": 0.7550815939903259 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.17177040874958038, "train/contrastive_loss": 1.7280198335647583, "train/negative_loss": 0.7447405457496643, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.983279287815094, "train/total_loss": 0.5173743963241577 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.17218448221683502, "train/contrastive_loss": 0.8346590995788574, "train/negative_loss": 0.834532618522644, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0001264890597667545, "train/total_loss": 0.33911630511283875 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.1112944632768631, "train/contrastive_loss": 1.037398338317871, "train/negative_loss": 0.5850278735160828, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.4523704946041107, "train/total_loss": 0.31877413392066956 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16975441575050354, "train/contrastive_loss": 2.80088210105896, "train/negative_loss": 1.5928813219070435, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.2080007791519165, "train/total_loss": 0.7299308776855469 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13797059655189514, "train/contrastive_loss": 2.165200710296631, "train/negative_loss": 0.5847959518432617, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.5804046392440796, "train/total_loss": 0.5710107088088989 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.15954400599002838, "train/contrastive_loss": 1.3343087434768677, "train/negative_loss": 1.3209974765777588, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.013311277143657207, "train/total_loss": 0.42640578746795654 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.20986954867839813, "train/contrastive_loss": 4.174795627593994, "train/negative_loss": 1.9875352382659912, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.187260389328003, "train/total_loss": 1.0448286533355713 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16387797892093658, "train/contrastive_loss": 1.3689451217651367, "train/negative_loss": 0.9319843053817749, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.4369608461856842, "train/total_loss": 0.43766701221466064 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.14226661622524261, "train/contrastive_loss": 3.805375099182129, "train/negative_loss": 0.9238763451576233, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.8814988136291504, "train/total_loss": 0.9033416509628296 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16320881247520447, "train/contrastive_loss": 0.8691606521606445, "train/negative_loss": 0.3121230900287628, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5570375323295593, "train/total_loss": 0.3370409607887268 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.1263202279806137, "train/contrastive_loss": 1.771242380142212, "train/negative_loss": 0.5729682445526123, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.1982741355895996, "train/total_loss": 0.48056870698928833 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16373278200626373, "train/contrastive_loss": 0.30273059010505676, "train/negative_loss": 0.2941136956214905, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.008616908453404903, "train/total_loss": 0.22427889704704285 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.14347781240940094, "train/contrastive_loss": 1.2606143951416016, "train/negative_loss": 0.46871668100357056, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.791897714138031, "train/total_loss": 0.39560067653656006 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.21395543217658997, "train/contrastive_loss": 3.584773540496826, "train/negative_loss": 1.303221344947815, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.2815520763397217, "train/total_loss": 0.9309101104736328 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13279476761817932, "train/contrastive_loss": 1.4508020877838135, "train/negative_loss": 1.4372400045394897, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.01356208510696888, "train/total_loss": 0.422955185174942 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13371767103672028, "train/contrastive_loss": 3.249382972717285, "train/negative_loss": 2.452887773513794, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7964953184127808, "train/total_loss": 0.7835942506790161 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.15158793330192566, "train/contrastive_loss": 1.7863094806671143, "train/negative_loss": 1.6163197755813599, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.169989675283432, "train/total_loss": 0.5088498592376709 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.2671091854572296, "train/contrastive_loss": 2.83126163482666, "train/negative_loss": 1.3494688272476196, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.48179292678833, "train/total_loss": 0.8333615064620972 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.1736839860677719, "train/contrastive_loss": 1.984739065170288, "train/negative_loss": 0.40271276235580444, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.5820263624191284, "train/total_loss": 0.5706318020820618 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.20055411756038666, "train/contrastive_loss": 2.465477466583252, "train/negative_loss": 1.534045934677124, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9314315319061279, "train/total_loss": 0.6936495900154114 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.1925583779811859, "train/contrastive_loss": 2.431614637374878, "train/negative_loss": 2.1127984523773193, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.3188161551952362, "train/total_loss": 0.6788812875747681 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.18313775956630707, "train/contrastive_loss": 0.34710225462913513, "train/negative_loss": 0.2658122479915619, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.08129000663757324, "train/total_loss": 0.2525582015514374 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.27189186215400696, "train/contrastive_loss": 3.0423965454101562, "train/negative_loss": 1.3593348264694214, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.6830615997314453, "train/total_loss": 0.8803712129592896 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.17986933887004852, "train/contrastive_loss": 0.6659830212593079, "train/negative_loss": 0.6557236909866333, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.010259347967803478, "train/total_loss": 0.31306594610214233 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.18539486825466156, "train/contrastive_loss": 1.5846210718154907, "train/negative_loss": 1.367700457572937, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.21692058444023132, "train/total_loss": 0.5023190975189209 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.14992345869541168, "train/contrastive_loss": 2.1614699363708496, "train/negative_loss": 1.3060417175292969, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8554282188415527, "train/total_loss": 0.5822174549102783 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.18701496720314026, "train/contrastive_loss": 2.342538595199585, "train/negative_loss": 1.2122130393981934, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.1303255558013916, "train/total_loss": 0.6555227041244507 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.22230593860149384, "train/contrastive_loss": 2.030838966369629, "train/negative_loss": 1.4303054809570312, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.6005334854125977, "train/total_loss": 0.6284737586975098 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.20898309350013733, "train/contrastive_loss": 1.478989839553833, "train/negative_loss": 0.8801543712615967, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5988355278968811, "train/total_loss": 0.5047810673713684 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13425864279270172, "train/contrastive_loss": 1.332768440246582, "train/negative_loss": 1.3266702890396118, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.006098171230405569, "train/total_loss": 0.4008123278617859 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.22147367894649506, "train/contrastive_loss": 2.37888240814209, "train/negative_loss": 0.39433708786964417, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 1.984545350074768, "train/total_loss": 0.6972501873970032 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.24031203985214233, "train/contrastive_loss": 3.3356821537017822, "train/negative_loss": 3.214360475540161, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.12132158875465393, "train/total_loss": 0.9074484705924988 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.2125992327928543, "train/contrastive_loss": 1.0687923431396484, "train/negative_loss": 0.4468400478363037, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.6219522356987, "train/total_loss": 0.4263576865196228 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.29739734530448914, "train/contrastive_loss": 4.781063556671143, "train/negative_loss": 2.208695888519287, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.5723676681518555, "train/total_loss": 1.2536100149154663 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13947837054729462, "train/contrastive_loss": 1.1287579536437988, "train/negative_loss": 0.5803136229515076, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.5484442710876465, "train/total_loss": 0.3652299642562866 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.17628394067287445, "train/contrastive_loss": 2.966888904571533, "train/negative_loss": 1.6621443033218384, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.3047444820404053, "train/total_loss": 0.7696617245674133 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.14822180569171906, "train/contrastive_loss": 0.5378744006156921, "train/negative_loss": 0.5378078818321228, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 6.652127194683999e-05, "train/total_loss": 0.2557966709136963 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.28061428666114807, "train/contrastive_loss": 2.16581392288208, "train/negative_loss": 1.159152865409851, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.0066609382629395, "train/total_loss": 0.7137770652770996 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.15342897176742554, "train/contrastive_loss": 0.7659542560577393, "train/negative_loss": 0.7608383893966675, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.005115843378007412, "train/total_loss": 0.3066198229789734 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.32758885622024536, "train/contrastive_loss": 1.8111205101013184, "train/negative_loss": 0.9260818362236023, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.8850387334823608, "train/total_loss": 0.689812958240509 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13064444065093994, "train/contrastive_loss": 2.8732028007507324, "train/negative_loss": 0.8690221905708313, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.004180669784546, "train/total_loss": 0.7052850127220154 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16293343901634216, "train/contrastive_loss": 2.437732219696045, "train/negative_loss": 2.081183433532715, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.35654887557029724, "train/total_loss": 0.6504799127578735 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.2592998445034027, "train/contrastive_loss": 2.084942102432251, "train/negative_loss": 2.08493971824646, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 2.2649790025752736e-06, "train/total_loss": 0.6762882471084595 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.2063748985528946, "train/contrastive_loss": 2.7614307403564453, "train/negative_loss": 1.3759068250656128, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.3855239152908325, "train/total_loss": 0.7586610317230225 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.12094295769929886, "train/contrastive_loss": 0.18382498621940613, "train/negative_loss": 0.15728388726711273, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.026541098952293396, "train/total_loss": 0.15770795941352844 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.19040244817733765, "train/contrastive_loss": 1.179012656211853, "train/negative_loss": 0.9204587936401367, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.2585538625717163, "train/total_loss": 0.42620497941970825 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.18006786704063416, "train/contrastive_loss": 1.1357351541519165, "train/negative_loss": 0.9125902056694031, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.22314494848251343, "train/total_loss": 0.407214879989624 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.2964591383934021, "train/contrastive_loss": 3.240980386734009, "train/negative_loss": 1.3075833320617676, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.9333970546722412, "train/total_loss": 0.9446552395820618 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.15920165181159973, "train/contrastive_loss": 0.689811110496521, "train/negative_loss": 0.49601730704307556, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.19379381835460663, "train/total_loss": 0.29716387391090393 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.13423670828342438, "train/contrastive_loss": 1.5894420146942139, "train/negative_loss": 0.7994976043701172, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.7899444699287415, "train/total_loss": 0.4521251320838928 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.14847001433372498, "train/contrastive_loss": 1.1185154914855957, "train/negative_loss": 0.5615684390068054, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5569469928741455, "train/total_loss": 0.37217313051223755 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.19374050199985504, "train/contrastive_loss": 4.017642021179199, "train/negative_loss": 2.2876029014587402, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.730039119720459, "train/total_loss": 0.9972689151763916 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.19868767261505127, "train/contrastive_loss": 1.0947338342666626, "train/negative_loss": 0.5714030265808105, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.523330807685852, "train/total_loss": 0.41763442754745483 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.08811814337968826, "train/contrastive_loss": 0.2297048419713974, "train/negative_loss": 0.2284664362668991, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0012384126894176006, "train/total_loss": 0.1340591162443161 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.19191573560237885, "train/contrastive_loss": 2.388416290283203, "train/negative_loss": 1.7922662496566772, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.5961501002311707, "train/total_loss": 0.6695989966392517 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.20889155566692352, "train/contrastive_loss": 1.2571130990982056, "train/negative_loss": 1.2430636882781982, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.014049414545297623, "train/total_loss": 0.46031415462493896 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.1371251493692398, "train/contrastive_loss": 1.5753488540649414, "train/negative_loss": 0.7840390801429749, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.7913098335266113, "train/total_loss": 0.4521949291229248 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.23302072286605835, "train/contrastive_loss": 2.856095314025879, "train/negative_loss": 1.8790549039840698, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.9770404696464539, "train/total_loss": 0.804239809513092 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16038738191127777, "train/contrastive_loss": 2.011524200439453, "train/negative_loss": 0.7170014977455139, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.294522762298584, "train/total_loss": 0.5626922249794006 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.1599067747592926, "train/contrastive_loss": 5.245911121368408, "train/negative_loss": 5.245909690856934, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.5854857338126749e-06, "train/total_loss": 1.2090890407562256 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16568949818611145, "train/contrastive_loss": 0.7083851099014282, "train/negative_loss": 0.4586718678474426, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.2497132271528244, "train/total_loss": 0.3073665201663971 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.21125702559947968, "train/contrastive_loss": 2.7015156745910645, "train/negative_loss": 1.6683448553085327, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0331707000732422, "train/total_loss": 0.7515602111816406 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16208994388580322, "train/contrastive_loss": 2.0591349601745605, "train/negative_loss": 0.8783535957336426, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.1807812452316284, "train/total_loss": 0.5739169120788574 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.26127591729164124, "train/contrastive_loss": 1.510298252105713, "train/negative_loss": 1.1916983127593994, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.31859999895095825, "train/total_loss": 0.5633355379104614 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.16329923272132874, "train/contrastive_loss": 1.3590660095214844, "train/negative_loss": 0.9801003336906433, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.37896573543548584, "train/total_loss": 0.43511244654655457 }, { "epoch": 10.211267605633802, "eval_exact_match_accuracy": 0.32275132275132273, "eval_hamming_loss": 0.06463326071169208, "eval_loss": 0.5829338431358337, "eval_macro_f1": 0.4351002757555069, "eval_macro_precision": 0.6404843330845489, "eval_macro_recall": 0.3521258198223301, "eval_micro_f1": 0.5787694388100068, "eval_micro_precision": 0.7911275415896488, "eval_micro_recall": 0.4562899786780384, "eval_runtime": 2.8488, "eval_samples_per_second": 199.031, "eval_steps_per_second": 24.923, "step": 2900 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.10593006759881973, "train/contrastive_loss": 0.6669097542762756, "train/negative_loss": 0.6588942408561707, "train/num_negatives": 36, "train/num_positives": 20, "train/positive_loss": 0.008015519939363003, "train/total_loss": 0.23931202292442322 }, { "epoch": 10.211267605633802, "step": 2900, "train/classification_loss": 0.14086495339870453, "train/contrastive_loss": 1.5772793292999268, "train/negative_loss": 1.271799087524414, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 0.3054801821708679, "train/total_loss": 0.4563208222389221 }, { "epoch": 10.387323943661972, "grad_norm": 14.002019882202148, "learning_rate": 1.9598872445384076e-05, "loss": 0.6253, "step": 2950 }, { "epoch": 10.387323943661972, "step": 2950, "train/classification_loss": 0.07413940131664276, "train/contrastive_loss": 0.1552697718143463, "train/negative_loss": 0.13997884094715118, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.015290931798517704, "train/total_loss": 0.1051933541893959 }, { "epoch": 10.387323943661972, "step": 2950, "train/classification_loss": 0.1367824524641037, "train/contrastive_loss": 0.5186465978622437, "train/negative_loss": 0.5146605968475342, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.00398603081703186, "train/total_loss": 0.24051177501678467 }, { "epoch": 10.56338028169014, "grad_norm": 11.690299987792969, "learning_rate": 1.9591825229034534e-05, "loss": 0.6032, "step": 3000 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2762620747089386, "train/contrastive_loss": 2.3873162269592285, "train/negative_loss": 1.5687317848205566, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.8185845613479614, "train/total_loss": 0.7537252902984619 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.25543755292892456, "train/contrastive_loss": 1.2461047172546387, "train/negative_loss": 0.472343385219574, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.7737613916397095, "train/total_loss": 0.5046585202217102 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.23958174884319305, "train/contrastive_loss": 2.76216459274292, "train/negative_loss": 1.3364864587783813, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.425678014755249, "train/total_loss": 0.7920147180557251 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.16245520114898682, "train/contrastive_loss": 2.3808512687683105, "train/negative_loss": 1.7466623783111572, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6341889500617981, "train/total_loss": 0.6386255025863647 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2083040475845337, "train/contrastive_loss": 2.8997902870178223, "train/negative_loss": 2.8517308235168457, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.04805942624807358, "train/total_loss": 0.788262128829956 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.20814986526966095, "train/contrastive_loss": 2.683485507965088, "train/negative_loss": 1.347381591796875, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.3361037969589233, "train/total_loss": 0.7448469400405884 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.19245050847530365, "train/contrastive_loss": 2.4646382331848145, "train/negative_loss": 1.1738001108169556, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.2908380031585693, "train/total_loss": 0.6853781342506409 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.19908642768859863, "train/contrastive_loss": 1.0945513248443604, "train/negative_loss": 1.0945110321044922, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 4.0293551137438044e-05, "train/total_loss": 0.41799670457839966 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.10663730651140213, "train/contrastive_loss": 0.43518689274787903, "train/negative_loss": 0.4090810716152191, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.02610582672059536, "train/total_loss": 0.19367468357086182 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1675368696451187, "train/contrastive_loss": 1.748020887374878, "train/negative_loss": 0.7628961801528931, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.9851246476173401, "train/total_loss": 0.5171410441398621 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1484692394733429, "train/contrastive_loss": 1.2832281589508057, "train/negative_loss": 0.8856143951416016, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.3976137340068817, "train/total_loss": 0.40511488914489746 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.15774308145046234, "train/contrastive_loss": 1.4628280401229858, "train/negative_loss": 1.3172005414962769, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.14562752842903137, "train/total_loss": 0.4503086805343628 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.20536047220230103, "train/contrastive_loss": 3.2447919845581055, "train/negative_loss": 1.9048564434051514, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.339935541152954, "train/total_loss": 0.8543188571929932 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1619938760995865, "train/contrastive_loss": 1.0439677238464355, "train/negative_loss": 0.6946704983711243, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.34929725527763367, "train/total_loss": 0.37078744173049927 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.14412476122379303, "train/contrastive_loss": 3.019122838973999, "train/negative_loss": 0.9273945689201355, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.0917282104492188, "train/total_loss": 0.7479493021965027 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1468760371208191, "train/contrastive_loss": 0.5179504752159119, "train/negative_loss": 0.37436434626579285, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.14358612895011902, "train/total_loss": 0.25046613812446594 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.11221809685230255, "train/contrastive_loss": 0.8565540313720703, "train/negative_loss": 0.5195607542991638, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3369932770729065, "train/total_loss": 0.2835289239883423 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1688118875026703, "train/contrastive_loss": 0.9327883720397949, "train/negative_loss": 0.3360637128353119, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.5967246294021606, "train/total_loss": 0.35536956787109375 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.15971487760543823, "train/contrastive_loss": 2.3112308979034424, "train/negative_loss": 0.8913699984550476, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 1.4198609590530396, "train/total_loss": 0.6219610571861267 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.21708834171295166, "train/contrastive_loss": 3.3200504779815674, "train/negative_loss": 1.1901757717132568, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.1298747062683105, "train/total_loss": 0.8810984492301941 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1149444729089737, "train/contrastive_loss": 1.7186161279678345, "train/negative_loss": 1.7137479782104492, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.004868112504482269, "train/total_loss": 0.45866769552230835 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.13831518590450287, "train/contrastive_loss": 3.3318591117858887, "train/negative_loss": 2.577338218688965, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.7545210123062134, "train/total_loss": 0.8046870231628418 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.14285585284233093, "train/contrastive_loss": 1.9449069499969482, "train/negative_loss": 0.8926212787628174, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 1.0522856712341309, "train/total_loss": 0.5318372249603271 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.23551133275032043, "train/contrastive_loss": 2.9736928939819336, "train/negative_loss": 1.9470629692077637, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.02662992477417, "train/total_loss": 0.8302499055862427 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1685134321451187, "train/contrastive_loss": 2.478376865386963, "train/negative_loss": 1.3601411581039429, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.11823570728302, "train/total_loss": 0.664188802242279 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2670794427394867, "train/contrastive_loss": 3.8331222534179688, "train/negative_loss": 2.744384765625, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0887373685836792, "train/total_loss": 1.0337039232254028 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1832488775253296, "train/contrastive_loss": 2.2549726963043213, "train/negative_loss": 2.2538952827453613, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.001077397377230227, "train/total_loss": 0.6342434287071228 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2047833800315857, "train/contrastive_loss": 1.1822214126586914, "train/negative_loss": 1.1603710651397705, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.021850330755114555, "train/total_loss": 0.44122767448425293 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2744237780570984, "train/contrastive_loss": 3.28920841217041, "train/negative_loss": 1.2559646368026733, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 2.0332438945770264, "train/total_loss": 0.9322654604911804 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.18878227472305298, "train/contrastive_loss": 0.6206185817718506, "train/negative_loss": 0.6101956367492676, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.01042292919009924, "train/total_loss": 0.3129059970378876 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.18836022913455963, "train/contrastive_loss": 1.750382423400879, "train/negative_loss": 1.3351140022277832, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.4152684807777405, "train/total_loss": 0.5384367108345032 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1622367799282074, "train/contrastive_loss": 3.5931925773620605, "train/negative_loss": 2.5476036071777344, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0455890893936157, "train/total_loss": 0.8808753490447998 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1841551810503006, "train/contrastive_loss": 1.511103868484497, "train/negative_loss": 0.9502866864204407, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.5608171820640564, "train/total_loss": 0.48637598752975464 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.26156654953956604, "train/contrastive_loss": 2.263023853302002, "train/negative_loss": 1.9572700262069702, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.3057537078857422, "train/total_loss": 0.714171290397644 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2191566675901413, "train/contrastive_loss": 1.6404569149017334, "train/negative_loss": 0.8151454925537109, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.8253113627433777, "train/total_loss": 0.5472480654716492 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.16641321778297424, "train/contrastive_loss": 3.6082730293273926, "train/negative_loss": 3.6082630157470703, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 9.928638974088244e-06, "train/total_loss": 0.8880678415298462 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.21078330278396606, "train/contrastive_loss": 2.788423538208008, "train/negative_loss": 0.8298013806343079, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 1.9586220979690552, "train/total_loss": 0.7684680223464966 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.22494281828403473, "train/contrastive_loss": 3.441727638244629, "train/negative_loss": 2.8914742469787598, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.5502535104751587, "train/total_loss": 0.9132883548736572 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2436332106590271, "train/contrastive_loss": 0.7654647827148438, "train/negative_loss": 0.2511307895183563, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.5143340229988098, "train/total_loss": 0.39672619104385376 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.29328644275665283, "train/contrastive_loss": 4.5129265785217285, "train/negative_loss": 1.815167784690857, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.697758674621582, "train/total_loss": 1.1958718299865723 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.18113462626934052, "train/contrastive_loss": 2.5789456367492676, "train/negative_loss": 1.396188497543335, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.182757019996643, "train/total_loss": 0.6969237923622131 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1820196807384491, "train/contrastive_loss": 1.809961199760437, "train/negative_loss": 1.4282125234603882, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.38174864649772644, "train/total_loss": 0.5440119504928589 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.17479562759399414, "train/contrastive_loss": 0.9607092142105103, "train/negative_loss": 0.9605926275253296, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00011656926653813571, "train/total_loss": 0.36693745851516724 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2636986970901489, "train/contrastive_loss": 2.545609951019287, "train/negative_loss": 1.4108635187149048, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.1347464323043823, "train/total_loss": 0.7728207111358643 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.17134632170200348, "train/contrastive_loss": 1.4071953296661377, "train/negative_loss": 0.769248902797699, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.6379464864730835, "train/total_loss": 0.4527853727340698 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.3339294493198395, "train/contrastive_loss": 2.163451671600342, "train/negative_loss": 0.8712236881256104, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.292227864265442, "train/total_loss": 0.7666198015213013 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.13371475040912628, "train/contrastive_loss": 2.418879985809326, "train/negative_loss": 0.6593396067619324, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.759540319442749, "train/total_loss": 0.6174907684326172 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.18897037208080292, "train/contrastive_loss": 3.7722811698913574, "train/negative_loss": 3.054877281188965, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.7174040079116821, "train/total_loss": 0.9434266090393066 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.2586095929145813, "train/contrastive_loss": 2.0080924034118652, "train/negative_loss": 2.008091449737549, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 9.536747711536009e-07, "train/total_loss": 0.6602280735969543 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.19155491888523102, "train/contrastive_loss": 2.808267831802368, "train/negative_loss": 1.588202953338623, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.2200648784637451, "train/total_loss": 0.7532084584236145 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.11223132163286209, "train/contrastive_loss": 0.18879052996635437, "train/negative_loss": 0.1261802464723587, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.06261028349399567, "train/total_loss": 0.14998942613601685 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.18023742735385895, "train/contrastive_loss": 0.8828045129776001, "train/negative_loss": 0.8595558404922485, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.023248683661222458, "train/total_loss": 0.35679835081100464 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.19564281404018402, "train/contrastive_loss": 1.6861006021499634, "train/negative_loss": 1.5358744859695435, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.1502261459827423, "train/total_loss": 0.5328629612922668 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.30229437351226807, "train/contrastive_loss": 2.5030159950256348, "train/negative_loss": 1.3248379230499268, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.178178071975708, "train/total_loss": 0.802897572517395 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.14517316222190857, "train/contrastive_loss": 1.179174542427063, "train/negative_loss": 1.0594836473464966, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.11969085782766342, "train/total_loss": 0.3810080885887146 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.13750970363616943, "train/contrastive_loss": 0.7566724419593811, "train/negative_loss": 0.3975960314273834, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.3590764105319977, "train/total_loss": 0.28884419798851013 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.16646422445774078, "train/contrastive_loss": 2.040703773498535, "train/negative_loss": 1.0129212141036987, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0277825593948364, "train/total_loss": 0.5746049880981445 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.20582664012908936, "train/contrastive_loss": 4.210188388824463, "train/negative_loss": 1.2171884775161743, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 2.993000030517578, "train/total_loss": 1.047864317893982 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.19206711649894714, "train/contrastive_loss": 1.3858373165130615, "train/negative_loss": 0.7494128346443176, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.6364244818687439, "train/total_loss": 0.4692345857620239 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.10709568113088608, "train/contrastive_loss": 0.725210964679718, "train/negative_loss": 0.7208110690116882, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.004399867728352547, "train/total_loss": 0.2521378695964813 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1921747773885727, "train/contrastive_loss": 2.197178840637207, "train/negative_loss": 1.372187614440918, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.8249912261962891, "train/total_loss": 0.6316105723381042 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.23746086657047272, "train/contrastive_loss": 1.5042730569839478, "train/negative_loss": 1.3201839923858643, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.18408910930156708, "train/total_loss": 0.53831547498703 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.15973779559135437, "train/contrastive_loss": 2.2139954566955566, "train/negative_loss": 1.3080657720565796, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.9059298038482666, "train/total_loss": 0.6025369167327881 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.18993617594242096, "train/contrastive_loss": 1.3275916576385498, "train/negative_loss": 0.9583486914634705, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.36924299597740173, "train/total_loss": 0.4554545283317566 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.17862918972969055, "train/contrastive_loss": 2.797597885131836, "train/negative_loss": 0.7121429443359375, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 2.0854549407958984, "train/total_loss": 0.7381488084793091 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.14451172947883606, "train/contrastive_loss": 3.5993711948394775, "train/negative_loss": 3.5993692874908447, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.835825969465077e-06, "train/total_loss": 0.8643859624862671 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.15485413372516632, "train/contrastive_loss": 0.5619473457336426, "train/negative_loss": 0.354228138923645, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.20771919190883636, "train/total_loss": 0.2672435939311981 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.20139886438846588, "train/contrastive_loss": 2.9238600730895996, "train/negative_loss": 1.357291579246521, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.566568374633789, "train/total_loss": 0.7861708998680115 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.1958179622888565, "train/contrastive_loss": 2.95369553565979, "train/negative_loss": 1.2270042896270752, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.7266912460327148, "train/total_loss": 0.7865570783615112 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.25784116983413696, "train/contrastive_loss": 2.2676851749420166, "train/negative_loss": 1.1066980361938477, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.160987138748169, "train/total_loss": 0.7113782167434692 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.16992880403995514, "train/contrastive_loss": 0.767574667930603, "train/negative_loss": 0.7672322988510132, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.0003423854650463909, "train/total_loss": 0.323443740606308 }, { "epoch": 10.56338028169014, "eval_exact_match_accuracy": 0.30687830687830686, "eval_hamming_loss": 0.06867932358128437, "eval_loss": 0.6113051176071167, "eval_macro_f1": 0.39493366640337385, "eval_macro_precision": 0.6247004748047559, "eval_macro_recall": 0.31731720981631967, "eval_micro_f1": 0.5520974289580515, "eval_micro_precision": 0.7555555555555555, "eval_micro_recall": 0.4349680170575693, "eval_runtime": 2.8624, "eval_samples_per_second": 198.085, "eval_steps_per_second": 24.804, "step": 3000 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.13586701452732086, "train/contrastive_loss": 0.9734164476394653, "train/negative_loss": 0.7267447710037231, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.2466716766357422, "train/total_loss": 0.33055031299591064 }, { "epoch": 10.56338028169014, "step": 3000, "train/classification_loss": 0.22636692225933075, "train/contrastive_loss": 1.1001310348510742, "train/negative_loss": 0.4253845810890198, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.6747464537620544, "train/total_loss": 0.44639313220977783 }, { "epoch": 10.73943661971831, "grad_norm": 8.174198150634766, "learning_rate": 1.958477801268499e-05, "loss": 0.6474, "step": 3050 }, { "epoch": 10.73943661971831, "step": 3050, "train/classification_loss": 0.09077351540327072, "train/contrastive_loss": 1.7142343521118164, "train/negative_loss": 1.6784005165100098, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.03583380579948425, "train/total_loss": 0.4336203932762146 }, { "epoch": 10.73943661971831, "step": 3050, "train/classification_loss": 0.17790691554546356, "train/contrastive_loss": 0.7195115089416504, "train/negative_loss": 0.2735605835914612, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.4459509253501892, "train/total_loss": 0.32180923223495483 }, { "epoch": 10.915492957746478, "grad_norm": 22.022693634033203, "learning_rate": 1.957773079633545e-05, "loss": 0.5927, "step": 3100 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.2864118814468384, "train/contrastive_loss": 1.887838363647461, "train/negative_loss": 1.645249605178833, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.24258872866630554, "train/total_loss": 0.6639795303344727 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.24336405098438263, "train/contrastive_loss": 1.0732638835906982, "train/negative_loss": 0.5296627283096313, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5436012148857117, "train/total_loss": 0.4580168128013611 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.24337171018123627, "train/contrastive_loss": 3.356455087661743, "train/negative_loss": 1.7600804567337036, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.5963746309280396, "train/total_loss": 0.914662778377533 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18461358547210693, "train/contrastive_loss": 3.4242005348205566, "train/negative_loss": 2.0972795486450195, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.3269211053848267, "train/total_loss": 0.8694537281990051 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1745333969593048, "train/contrastive_loss": 2.0744104385375977, "train/negative_loss": 1.5164457559585571, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.5579646229743958, "train/total_loss": 0.5894154906272888 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.2251957356929779, "train/contrastive_loss": 2.4608092308044434, "train/negative_loss": 1.6046676635742188, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8561415076255798, "train/total_loss": 0.7173575758934021 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18051719665527344, "train/contrastive_loss": 1.5304803848266602, "train/negative_loss": 0.7692257761955261, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.761254608631134, "train/total_loss": 0.48661327362060547 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.16268013417720795, "train/contrastive_loss": 0.45500245690345764, "train/negative_loss": 0.4549833834171295, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 1.9073668227065355e-05, "train/total_loss": 0.25368061661720276 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1237364113330841, "train/contrastive_loss": 2.254930257797241, "train/negative_loss": 0.9909666776657104, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.2639635801315308, "train/total_loss": 0.5747224688529968 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.16575469076633453, "train/contrastive_loss": 1.8757065534591675, "train/negative_loss": 1.4117900133132935, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.463916540145874, "train/total_loss": 0.5408959984779358 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.13043059408664703, "train/contrastive_loss": 1.236993432044983, "train/negative_loss": 0.379549115896225, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.8574442863464355, "train/total_loss": 0.37782928347587585 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.17029546201229095, "train/contrastive_loss": 2.510523796081543, "train/negative_loss": 1.636656403541565, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8738675117492676, "train/total_loss": 0.6724002361297607 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.21521975100040436, "train/contrastive_loss": 3.4830446243286133, "train/negative_loss": 1.8847639560699463, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.598280668258667, "train/total_loss": 0.9118286967277527 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.15509048104286194, "train/contrastive_loss": 1.3517342805862427, "train/negative_loss": 0.742401659488678, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.6093326210975647, "train/total_loss": 0.425437331199646 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.12977679073810577, "train/contrastive_loss": 2.0522046089172363, "train/negative_loss": 0.5493854880332947, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.5028190612792969, "train/total_loss": 0.5402176976203918 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.16477005183696747, "train/contrastive_loss": 1.2424614429473877, "train/negative_loss": 0.30191347002983093, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.9405479431152344, "train/total_loss": 0.41326233744621277 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1339196115732193, "train/contrastive_loss": 1.1581369638442993, "train/negative_loss": 0.12770843505859375, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.0304285287857056, "train/total_loss": 0.3655470013618469 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.19022709131240845, "train/contrastive_loss": 1.423992395401001, "train/negative_loss": 0.4855671226978302, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.9384252429008484, "train/total_loss": 0.47502556443214417 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1645231544971466, "train/contrastive_loss": 1.8002641201019287, "train/negative_loss": 0.862368106842041, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.9378959536552429, "train/total_loss": 0.52457594871521 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.20813487470149994, "train/contrastive_loss": 3.664506673812866, "train/negative_loss": 1.383126974105835, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.2813796997070312, "train/total_loss": 0.9410362243652344 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.11586124449968338, "train/contrastive_loss": 1.495785117149353, "train/negative_loss": 1.4938901662826538, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.00189495540689677, "train/total_loss": 0.4150182604789734 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.11913207173347473, "train/contrastive_loss": 2.461695909500122, "train/negative_loss": 1.6116716861724854, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8500242233276367, "train/total_loss": 0.6114712953567505 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.16245511174201965, "train/contrastive_loss": 2.0862247943878174, "train/negative_loss": 2.040592670440674, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.04563206061720848, "train/total_loss": 0.5797001123428345 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.28559696674346924, "train/contrastive_loss": 2.0909156799316406, "train/negative_loss": 1.271106243133545, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.8198093175888062, "train/total_loss": 0.7037801146507263 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1815870702266693, "train/contrastive_loss": 2.731168031692505, "train/negative_loss": 0.738377034664154, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.9927910566329956, "train/total_loss": 0.727820634841919 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.19949638843536377, "train/contrastive_loss": 2.3821473121643066, "train/negative_loss": 1.4946497678756714, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8874974846839905, "train/total_loss": 0.6759258508682251 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18911835551261902, "train/contrastive_loss": 3.349832534790039, "train/negative_loss": 1.8693777322769165, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 1.480454921722412, "train/total_loss": 0.8590848445892334 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.17546650767326355, "train/contrastive_loss": 0.23197080194950104, "train/negative_loss": 0.16607673466205597, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.06589406728744507, "train/total_loss": 0.22186067700386047 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.2607475817203522, "train/contrastive_loss": 2.7584080696105957, "train/negative_loss": 1.547375202178955, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.211032748222351, "train/total_loss": 0.8124291896820068 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18682272732257843, "train/contrastive_loss": 0.9725147485733032, "train/negative_loss": 0.9686235189437866, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0038912203162908554, "train/total_loss": 0.3813256621360779 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.15884801745414734, "train/contrastive_loss": 1.14173424243927, "train/negative_loss": 1.0859134197235107, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.05582084506750107, "train/total_loss": 0.3871948719024658 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1540917456150055, "train/contrastive_loss": 1.5852687358856201, "train/negative_loss": 1.068734884262085, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5165338516235352, "train/total_loss": 0.47114551067352295 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18662399053573608, "train/contrastive_loss": 1.9513202905654907, "train/negative_loss": 1.1811792850494385, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7701410055160522, "train/total_loss": 0.5768880844116211 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.21067319810390472, "train/contrastive_loss": 2.445605754852295, "train/negative_loss": 1.8993991613388062, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.5462064743041992, "train/total_loss": 0.699794352054596 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.21469761431217194, "train/contrastive_loss": 2.5030813217163086, "train/negative_loss": 1.2699363231658936, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.2331451177597046, "train/total_loss": 0.7153138518333435 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.13888822495937347, "train/contrastive_loss": 1.0031150579452515, "train/negative_loss": 0.9300569891929626, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.07305808365345001, "train/total_loss": 0.3395112454891205 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18932612240314484, "train/contrastive_loss": 2.515317440032959, "train/negative_loss": 0.7715743780136108, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 1.7437431812286377, "train/total_loss": 0.6923896074295044 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.23474206030368805, "train/contrastive_loss": 2.8058667182922363, "train/negative_loss": 2.665243148803711, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.14062350988388062, "train/total_loss": 0.795915424823761 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.2089659720659256, "train/contrastive_loss": 1.217363715171814, "train/negative_loss": 0.5548285841941833, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.6625351309776306, "train/total_loss": 0.45243871212005615 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.2850220501422882, "train/contrastive_loss": 4.733141899108887, "train/negative_loss": 2.235766887664795, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.497375011444092, "train/total_loss": 1.231650471687317 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.13214343786239624, "train/contrastive_loss": 0.8666453957557678, "train/negative_loss": 0.6629396677017212, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.20370574295520782, "train/total_loss": 0.3054725229740143 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1611281782388687, "train/contrastive_loss": 1.518791913986206, "train/negative_loss": 1.1376475095748901, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.3811444342136383, "train/total_loss": 0.46488654613494873 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.15202417969703674, "train/contrastive_loss": 0.5903093218803406, "train/negative_loss": 0.5901009440422058, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00020837149349972606, "train/total_loss": 0.27008605003356934 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.238716259598732, "train/contrastive_loss": 0.6789034605026245, "train/negative_loss": 0.6504549980163574, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.02844846621155739, "train/total_loss": 0.3744969367980957 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.15262065827846527, "train/contrastive_loss": 0.8248007893562317, "train/negative_loss": 0.7848192453384399, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.03998157009482384, "train/total_loss": 0.31758081912994385 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.33645617961883545, "train/contrastive_loss": 2.646329402923584, "train/negative_loss": 1.732357144355774, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.9139721393585205, "train/total_loss": 0.8657220602035522 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.13383379578590393, "train/contrastive_loss": 2.0540456771850586, "train/negative_loss": 1.0507713556289673, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.0032742023468018, "train/total_loss": 0.5446429252624512 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.17278072237968445, "train/contrastive_loss": 1.8779497146606445, "train/negative_loss": 1.5615594387054443, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.31639033555984497, "train/total_loss": 0.5483706593513489 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.303207665681839, "train/contrastive_loss": 2.935037612915039, "train/negative_loss": 2.9350357055664062, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.7881409348774469e-06, "train/total_loss": 0.8902151584625244 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.21228420734405518, "train/contrastive_loss": 2.569387435913086, "train/negative_loss": 1.3032070398330688, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.2661805152893066, "train/total_loss": 0.7261617183685303 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.12310808151960373, "train/contrastive_loss": 0.2326999306678772, "train/negative_loss": 0.07561866194009781, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.1570812612771988, "train/total_loss": 0.16964806616306305 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.21158453822135925, "train/contrastive_loss": 1.064109444618225, "train/negative_loss": 1.003908395767212, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.06020107865333557, "train/total_loss": 0.42440640926361084 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.18313325941562653, "train/contrastive_loss": 1.17430579662323, "train/negative_loss": 0.9207723736763, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.25353342294692993, "train/total_loss": 0.4179944396018982 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.3142702877521515, "train/contrastive_loss": 4.130368232727051, "train/negative_loss": 1.5191065073013306, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 2.6112618446350098, "train/total_loss": 1.1403439044952393 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1566716879606247, "train/contrastive_loss": 1.673736333847046, "train/negative_loss": 0.4677121937274933, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.206024169921875, "train/total_loss": 0.4914189577102661 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.12629804015159607, "train/contrastive_loss": 0.620015025138855, "train/negative_loss": 0.36873212456703186, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.2512829005718231, "train/total_loss": 0.2503010630607605 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.14527374505996704, "train/contrastive_loss": 0.9354717135429382, "train/negative_loss": 0.612289309501648, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.3231824040412903, "train/total_loss": 0.33236807584762573 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.2021377980709076, "train/contrastive_loss": 2.8250555992126465, "train/negative_loss": 1.6179020404815674, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.207153558731079, "train/total_loss": 0.7671489715576172 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.19269733130931854, "train/contrastive_loss": 0.7300717830657959, "train/negative_loss": 0.20723435282707214, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.5228374004364014, "train/total_loss": 0.338711678981781 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.08335969597101212, "train/contrastive_loss": 0.19011488556861877, "train/negative_loss": 0.16568341851234436, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.024431472644209862, "train/total_loss": 0.12138266861438751 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.20223596692085266, "train/contrastive_loss": 2.590609073638916, "train/negative_loss": 1.370938777923584, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 1.2196701765060425, "train/total_loss": 0.7203577756881714 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1792982667684555, "train/contrastive_loss": 0.8562071323394775, "train/negative_loss": 0.8168087005615234, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.03939841687679291, "train/total_loss": 0.3505396842956543 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.13246937096118927, "train/contrastive_loss": 1.981392502784729, "train/negative_loss": 0.9428377151489258, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.0385547876358032, "train/total_loss": 0.5287478566169739 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.20984430611133575, "train/contrastive_loss": 2.0217764377593994, "train/negative_loss": 0.9913319945335388, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.0304443836212158, "train/total_loss": 0.6141995787620544 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.1769595444202423, "train/contrastive_loss": 2.7295522689819336, "train/negative_loss": 0.8510855436325073, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.8784666061401367, "train/total_loss": 0.7228699922561646 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.13547709584236145, "train/contrastive_loss": 2.775662660598755, "train/negative_loss": 2.7756612300872803, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 1.370908194076037e-06, "train/total_loss": 0.6906096935272217 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.16970960795879364, "train/contrastive_loss": 0.7779986262321472, "train/negative_loss": 0.5800029635429382, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.19799566268920898, "train/total_loss": 0.3253093361854553 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.21894241869449615, "train/contrastive_loss": 2.8856682777404785, "train/negative_loss": 1.7207978963851929, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1648703813552856, "train/total_loss": 0.7960760593414307 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.14858795702457428, "train/contrastive_loss": 1.9505035877227783, "train/negative_loss": 0.8634089827537537, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.0870946645736694, "train/total_loss": 0.5386886596679688 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.28609156608581543, "train/contrastive_loss": 2.2845277786254883, "train/negative_loss": 1.8844904899597168, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.40003716945648193, "train/total_loss": 0.7429971694946289 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.14781293272972107, "train/contrastive_loss": 0.9626945853233337, "train/negative_loss": 0.8595737814903259, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.103120818734169, "train/total_loss": 0.3403518497943878 }, { "epoch": 10.915492957746478, "eval_exact_match_accuracy": 0.30158730158730157, "eval_hamming_loss": 0.06608569353667393, "eval_loss": 0.5665774941444397, "eval_macro_f1": 0.41538974594908723, "eval_macro_precision": 0.6422816414068047, "eval_macro_recall": 0.3289031447309365, "eval_micro_f1": 0.5542337298810357, "eval_micro_precision": 0.8065173116089613, "eval_micro_recall": 0.42217484008528783, "eval_runtime": 2.8429, "eval_samples_per_second": 199.446, "eval_steps_per_second": 24.975, "step": 3100 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.16276085376739502, "train/contrastive_loss": 1.175837516784668, "train/negative_loss": 0.42145830392837524, "train/num_negatives": 40, "train/num_positives": 6, "train/positive_loss": 0.754379153251648, "train/total_loss": 0.3979283571243286 }, { "epoch": 10.915492957746478, "step": 3100, "train/classification_loss": 0.0897907018661499, "train/contrastive_loss": 0.2587071359157562, "train/negative_loss": 0.19876466691493988, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.059942472726106644, "train/total_loss": 0.14153212308883667 }, { "epoch": 11.091549295774648, "grad_norm": 5.6430487632751465, "learning_rate": 1.9570683579985908e-05, "loss": 0.579, "step": 3150 }, { "epoch": 11.091549295774648, "step": 3150, "train/classification_loss": 0.12388253211975098, "train/contrastive_loss": 0.2602914869785309, "train/negative_loss": 0.25685280561447144, "train/num_negatives": 38, "train/num_positives": 18, "train/positive_loss": 0.00343866809271276, "train/total_loss": 0.17594082653522491 }, { "epoch": 11.091549295774648, "step": 3150, "train/classification_loss": 0.10799126327037811, "train/contrastive_loss": 0.43816837668418884, "train/negative_loss": 0.20483598113059998, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.23333239555358887, "train/total_loss": 0.1956249475479126 }, { "epoch": 11.267605633802816, "grad_norm": 4.246716022491455, "learning_rate": 1.9563636363636366e-05, "loss": 0.5639, "step": 3200 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2657213509082794, "train/contrastive_loss": 2.4152140617370605, "train/negative_loss": 1.125178337097168, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.2900358438491821, "train/total_loss": 0.748764157295227 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2557452321052551, "train/contrastive_loss": 0.7766358256340027, "train/negative_loss": 0.4335929751396179, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.34304285049438477, "train/total_loss": 0.41107240319252014 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.24305664002895355, "train/contrastive_loss": 2.6732258796691895, "train/negative_loss": 1.402230978012085, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 1.270994782447815, "train/total_loss": 0.7777018547058105 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.17530137300491333, "train/contrastive_loss": 2.785922050476074, "train/negative_loss": 2.2605278491973877, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5253943204879761, "train/total_loss": 0.7324857711791992 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19417934119701385, "train/contrastive_loss": 2.4107208251953125, "train/negative_loss": 2.1431233882904053, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.267597496509552, "train/total_loss": 0.6763235330581665 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2095743864774704, "train/contrastive_loss": 2.0488786697387695, "train/negative_loss": 1.1765451431274414, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.8723334074020386, "train/total_loss": 0.6193501353263855 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1819399893283844, "train/contrastive_loss": 1.5255699157714844, "train/negative_loss": 0.6970598697662354, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.8285099864006042, "train/total_loss": 0.4870539903640747 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.18864093720912933, "train/contrastive_loss": 1.0019463300704956, "train/negative_loss": 1.0014688968658447, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.00047742793685756624, "train/total_loss": 0.38903021812438965 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.10362506657838821, "train/contrastive_loss": 0.5058585405349731, "train/negative_loss": 0.28313660621643066, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.22272193431854248, "train/total_loss": 0.20479677617549896 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1796669065952301, "train/contrastive_loss": 2.56162428855896, "train/negative_loss": 1.7271939516067505, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.8344303369522095, "train/total_loss": 0.6919918060302734 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.14753808081150055, "train/contrastive_loss": 1.4757665395736694, "train/negative_loss": 0.9883856773376465, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.48738083243370056, "train/total_loss": 0.4426913857460022 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.16208414733409882, "train/contrastive_loss": 1.2481707334518433, "train/negative_loss": 1.0363537073135376, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.21181702613830566, "train/total_loss": 0.41171830892562866 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19019164144992828, "train/contrastive_loss": 3.2874152660369873, "train/negative_loss": 1.6921882629394531, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.5952270030975342, "train/total_loss": 0.8476746678352356 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15533556044101715, "train/contrastive_loss": 1.011749505996704, "train/negative_loss": 0.698829174041748, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.3129202723503113, "train/total_loss": 0.3576854467391968 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.14520874619483948, "train/contrastive_loss": 2.6112098693847656, "train/negative_loss": 0.7664363980293274, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.844773530960083, "train/total_loss": 0.6674507856369019 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.14024148881435394, "train/contrastive_loss": 0.7283188104629517, "train/negative_loss": 0.2680666446685791, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.46025216579437256, "train/total_loss": 0.28590524196624756 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.11755108833312988, "train/contrastive_loss": 1.118392825126648, "train/negative_loss": 0.544413149356842, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5739796757698059, "train/total_loss": 0.3412296772003174 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.17467555403709412, "train/contrastive_loss": 1.3797621726989746, "train/negative_loss": 0.34697166085243225, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 1.0327905416488647, "train/total_loss": 0.45062798261642456 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15240579843521118, "train/contrastive_loss": 2.2916314601898193, "train/negative_loss": 1.2864196300506592, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 1.0052118301391602, "train/total_loss": 0.6107320785522461 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.22683919966220856, "train/contrastive_loss": 3.8062803745269775, "train/negative_loss": 1.1943809986114502, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.6118993759155273, "train/total_loss": 0.9880952835083008 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1141100600361824, "train/contrastive_loss": 1.0588958263397217, "train/negative_loss": 1.0526171922683716, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.006278581917285919, "train/total_loss": 0.3258892297744751 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1382991522550583, "train/contrastive_loss": 2.9155030250549316, "train/negative_loss": 2.0782766342163086, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8372265100479126, "train/total_loss": 0.7213997840881348 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.13700391352176666, "train/contrastive_loss": 1.6794188022613525, "train/negative_loss": 1.38852858543396, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.2908901572227478, "train/total_loss": 0.47288769483566284 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.22930797934532166, "train/contrastive_loss": 1.8620128631591797, "train/negative_loss": 1.4810782670974731, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.38093459606170654, "train/total_loss": 0.6017105579376221 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.16875040531158447, "train/contrastive_loss": 2.291365146636963, "train/negative_loss": 1.2841113805770874, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.007253646850586, "train/total_loss": 0.627023458480835 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.22738637030124664, "train/contrastive_loss": 3.314983606338501, "train/negative_loss": 2.4215595722198486, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8934239745140076, "train/total_loss": 0.8903830647468567 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.18316414952278137, "train/contrastive_loss": 1.8833078145980835, "train/negative_loss": 1.883018136024475, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.00028972988366149366, "train/total_loss": 0.5598257184028625 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.17130056023597717, "train/contrastive_loss": 0.2737555503845215, "train/negative_loss": 0.23766019940376282, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.03609533980488777, "train/total_loss": 0.2260516732931137 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2610934376716614, "train/contrastive_loss": 2.8144679069519043, "train/negative_loss": 1.6672781705856323, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.147189736366272, "train/total_loss": 0.8239870071411133 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.18560656905174255, "train/contrastive_loss": 0.6844651103019714, "train/negative_loss": 0.6806688904762268, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.003796215867623687, "train/total_loss": 0.3224995732307434 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.17031270265579224, "train/contrastive_loss": 1.5365175008773804, "train/negative_loss": 1.4684834480285645, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.0680341050028801, "train/total_loss": 0.47761622071266174 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15797072649002075, "train/contrastive_loss": 2.588449478149414, "train/negative_loss": 2.09267258644104, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.4957770109176636, "train/total_loss": 0.6756606101989746 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1835637092590332, "train/contrastive_loss": 1.3325707912445068, "train/negative_loss": 0.6118554472923279, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.7207152843475342, "train/total_loss": 0.4500778615474701 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.23642148077487946, "train/contrastive_loss": 2.7995941638946533, "train/negative_loss": 1.9201481342315674, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.8794460296630859, "train/total_loss": 0.79634028673172 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.23108001053333282, "train/contrastive_loss": 1.940598726272583, "train/negative_loss": 1.0866413116455078, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.8539574146270752, "train/total_loss": 0.6191997528076172 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15691709518432617, "train/contrastive_loss": 2.119863748550415, "train/negative_loss": 2.119856357574463, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 7.459197604475776e-06, "train/total_loss": 0.5808898210525513 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19563058018684387, "train/contrastive_loss": 2.2068891525268555, "train/negative_loss": 0.7632665634155273, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 1.4436225891113281, "train/total_loss": 0.6370084285736084 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.23053982853889465, "train/contrastive_loss": 2.235748529434204, "train/negative_loss": 1.96981680393219, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.2659316658973694, "train/total_loss": 0.6776895523071289 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2153698056936264, "train/contrastive_loss": 0.7962314486503601, "train/negative_loss": 0.3385002911090851, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.457731157541275, "train/total_loss": 0.3746160864830017 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2736409604549408, "train/contrastive_loss": 4.180439472198486, "train/negative_loss": 1.5394563674926758, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.6409831047058105, "train/total_loss": 1.1097288131713867 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1687142699956894, "train/contrastive_loss": 1.5914890766143799, "train/negative_loss": 1.19833505153656, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.3931540548801422, "train/total_loss": 0.4870120882987976 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.18804609775543213, "train/contrastive_loss": 2.65848708152771, "train/negative_loss": 1.5354578495025635, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.1230292320251465, "train/total_loss": 0.719743549823761 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15927208960056305, "train/contrastive_loss": 0.6541785001754761, "train/negative_loss": 0.6539868712425232, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0001916557375807315, "train/total_loss": 0.290107786655426 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.24697287380695343, "train/contrastive_loss": 0.8290350437164307, "train/negative_loss": 0.7988327145576477, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.03020232729613781, "train/total_loss": 0.41277986764907837 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15328232944011688, "train/contrastive_loss": 0.5345073342323303, "train/negative_loss": 0.525547444820404, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.008959909901022911, "train/total_loss": 0.26018381118774414 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.35116690397262573, "train/contrastive_loss": 2.0803022384643555, "train/negative_loss": 0.9331258535385132, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.1471765041351318, "train/total_loss": 0.7672273516654968 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1320287138223648, "train/contrastive_loss": 2.4381017684936523, "train/negative_loss": 0.8239127397537231, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.6141890287399292, "train/total_loss": 0.6196490526199341 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19773712754249573, "train/contrastive_loss": 3.7626452445983887, "train/negative_loss": 3.1881208419799805, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5745243430137634, "train/total_loss": 0.9502662420272827 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.28499636054039, "train/contrastive_loss": 2.309828042984009, "train/negative_loss": 2.309826612472534, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.3113030945532955e-06, "train/total_loss": 0.7469619512557983 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.196963831782341, "train/contrastive_loss": 3.1224212646484375, "train/negative_loss": 1.2401056289672852, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.8823156356811523, "train/total_loss": 0.8214480876922607 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.11312103271484375, "train/contrastive_loss": 0.1012469157576561, "train/negative_loss": 0.08254464715719223, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.018702266737818718, "train/total_loss": 0.13337041437625885 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19312772154808044, "train/contrastive_loss": 0.7449637651443481, "train/negative_loss": 0.6785001158714294, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.06646361947059631, "train/total_loss": 0.3421204686164856 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1988956779241562, "train/contrastive_loss": 1.525086760520935, "train/negative_loss": 1.246677041053772, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.2784097194671631, "train/total_loss": 0.5039130449295044 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.27779915928840637, "train/contrastive_loss": 2.391793966293335, "train/negative_loss": 0.9761002659797668, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.4156936407089233, "train/total_loss": 0.7561579942703247 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1357644945383072, "train/contrastive_loss": 0.4140526056289673, "train/negative_loss": 0.22338993847370148, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.19066265225410461, "train/total_loss": 0.21857501566410065 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.12739631533622742, "train/contrastive_loss": 0.8716710805892944, "train/negative_loss": 0.6946232914924622, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.17704780399799347, "train/total_loss": 0.30173051357269287 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15808850526809692, "train/contrastive_loss": 2.0376715660095215, "train/negative_loss": 0.7465929388999939, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.2910786867141724, "train/total_loss": 0.5656228065490723 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.1801939159631729, "train/contrastive_loss": 2.3404970169067383, "train/negative_loss": 0.9966110587120056, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.343885898590088, "train/total_loss": 0.6482933163642883 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19381454586982727, "train/contrastive_loss": 1.2143474817276, "train/negative_loss": 0.7627474665641785, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.45160001516342163, "train/total_loss": 0.4366840422153473 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.09656321257352829, "train/contrastive_loss": 0.42125219106674194, "train/negative_loss": 0.4189333915710449, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.0023188029881566763, "train/total_loss": 0.18081365525722504 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.19637297093868256, "train/contrastive_loss": 2.6825804710388184, "train/negative_loss": 1.944100260734558, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.738480269908905, "train/total_loss": 0.7328891158103943 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.22072051465511322, "train/contrastive_loss": 1.3003768920898438, "train/negative_loss": 1.2969356775283813, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.0034412278328090906, "train/total_loss": 0.4807959198951721 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15202614665031433, "train/contrastive_loss": 2.108879327774048, "train/negative_loss": 0.9631352424621582, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.1457440853118896, "train/total_loss": 0.5738019943237305 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.18210817873477936, "train/contrastive_loss": 1.1530498266220093, "train/negative_loss": 0.9356790781021118, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.21737070381641388, "train/total_loss": 0.41271814703941345 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.17568279802799225, "train/contrastive_loss": 2.3337693214416504, "train/negative_loss": 0.6237368583679199, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.71003258228302, "train/total_loss": 0.642436683177948 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15240773558616638, "train/contrastive_loss": 2.2747690677642822, "train/negative_loss": 2.2747669219970703, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.0265620150894392e-06, "train/total_loss": 0.6073615550994873 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15467776358127594, "train/contrastive_loss": 0.8875606060028076, "train/negative_loss": 0.38291463255882263, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.5046459436416626, "train/total_loss": 0.3321898877620697 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.2030763179063797, "train/contrastive_loss": 2.305759906768799, "train/negative_loss": 1.2035760879516602, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.1021839380264282, "train/total_loss": 0.6642283201217651 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.15912555158138275, "train/contrastive_loss": 1.9390206336975098, "train/negative_loss": 0.7214970588684082, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.2175235748291016, "train/total_loss": 0.546929657459259 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.26647865772247314, "train/contrastive_loss": 1.6334317922592163, "train/negative_loss": 1.2446074485778809, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.38882434368133545, "train/total_loss": 0.5931650400161743 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.17929764091968536, "train/contrastive_loss": 0.8770337700843811, "train/negative_loss": 0.8769389986991882, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 9.478629363002256e-05, "train/total_loss": 0.3547043800354004 }, { "epoch": 11.267605633802816, "eval_exact_match_accuracy": 0.30864197530864196, "eval_hamming_loss": 0.06753812636165578, "eval_loss": 0.5526972413063049, "eval_macro_f1": 0.41685994852399694, "eval_macro_precision": 0.5955618442810778, "eval_macro_recall": 0.3481723928585303, "eval_micro_f1": 0.5680159256801592, "eval_micro_precision": 0.7521968365553603, "eval_micro_recall": 0.4562899786780384, "eval_runtime": 2.8463, "eval_samples_per_second": 199.209, "eval_steps_per_second": 24.945, "step": 3200 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.20883125066757202, "train/contrastive_loss": 0.7995290756225586, "train/negative_loss": 0.5994036793708801, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.20012541115283966, "train/total_loss": 0.3687370717525482 }, { "epoch": 11.267605633802816, "step": 3200, "train/classification_loss": 0.08999417722225189, "train/contrastive_loss": 0.4491097927093506, "train/negative_loss": 0.44908660650253296, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.318649785593152e-05, "train/total_loss": 0.1798161268234253 }, { "epoch": 11.443661971830986, "grad_norm": 11.294279098510742, "learning_rate": 1.9556589147286824e-05, "loss": 0.564, "step": 3250 }, { "epoch": 11.443661971830986, "step": 3250, "train/classification_loss": 0.10319013148546219, "train/contrastive_loss": 0.5846144556999207, "train/negative_loss": 0.5358230471611023, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.04879140853881836, "train/total_loss": 0.22011302411556244 }, { "epoch": 11.443661971830986, "step": 3250, "train/classification_loss": 0.109939806163311, "train/contrastive_loss": 1.1497458219528198, "train/negative_loss": 1.0219770669937134, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.12776875495910645, "train/total_loss": 0.33988896012306213 }, { "epoch": 11.619718309859154, "grad_norm": 6.208378791809082, "learning_rate": 1.9549541930937282e-05, "loss": 0.5965, "step": 3300 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.271824449300766, "train/contrastive_loss": 2.7425999641418457, "train/negative_loss": 1.4797563552856445, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.2628434896469116, "train/total_loss": 0.8203444480895996 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2308635115623474, "train/contrastive_loss": 0.5782185792922974, "train/negative_loss": 0.40379682183265686, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.1744217574596405, "train/total_loss": 0.3465072214603424 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2390766143798828, "train/contrastive_loss": 2.477250099182129, "train/negative_loss": 1.5003087520599365, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9769412875175476, "train/total_loss": 0.7345266342163086 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1614062339067459, "train/contrastive_loss": 2.4115052223205566, "train/negative_loss": 1.9254984855651855, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.48600685596466064, "train/total_loss": 0.643707275390625 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2126631736755371, "train/contrastive_loss": 2.995148181915283, "train/negative_loss": 2.3923137187957764, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.6028344631195068, "train/total_loss": 0.8116928339004517 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2108817845582962, "train/contrastive_loss": 2.171492099761963, "train/negative_loss": 1.3912353515625, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.7802567481994629, "train/total_loss": 0.6451802253723145 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17042870819568634, "train/contrastive_loss": 1.3452556133270264, "train/negative_loss": 0.9358770847320557, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.4093785583972931, "train/total_loss": 0.4394798278808594 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17551346123218536, "train/contrastive_loss": 1.0474576950073242, "train/negative_loss": 1.0466018915176392, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.000855811988003552, "train/total_loss": 0.38500499725341797 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.10680711269378662, "train/contrastive_loss": 0.8097406625747681, "train/negative_loss": 0.6321636438369751, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.17757698893547058, "train/total_loss": 0.2687552571296692 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17906393110752106, "train/contrastive_loss": 3.3575968742370605, "train/negative_loss": 2.1975290775299072, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 1.1600677967071533, "train/total_loss": 0.8505833148956299 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.13731499016284943, "train/contrastive_loss": 1.4563870429992676, "train/negative_loss": 0.9088473916053772, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.5475396513938904, "train/total_loss": 0.42859238386154175 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1645163595676422, "train/contrastive_loss": 1.7096819877624512, "train/negative_loss": 1.533729076385498, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.1759529560804367, "train/total_loss": 0.5064527988433838 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.20296643674373627, "train/contrastive_loss": 3.4124557971954346, "train/negative_loss": 1.9307470321655273, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.4817087650299072, "train/total_loss": 0.8854576349258423 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.15907734632492065, "train/contrastive_loss": 1.0022470951080322, "train/negative_loss": 0.509635329246521, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.49261170625686646, "train/total_loss": 0.35952675342559814 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.13546057045459747, "train/contrastive_loss": 2.107813835144043, "train/negative_loss": 0.5898329019546509, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.5179810523986816, "train/total_loss": 0.5570233464241028 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.15548749268054962, "train/contrastive_loss": 0.6722891330718994, "train/negative_loss": 0.2584424316883087, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.4138466715812683, "train/total_loss": 0.2899453043937683 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.10703416913747787, "train/contrastive_loss": 1.0288366079330444, "train/negative_loss": 0.1696818321943283, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.8591547608375549, "train/total_loss": 0.3128014802932739 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.16292981803417206, "train/contrastive_loss": 1.232163906097412, "train/negative_loss": 0.3997874855995178, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.8323764801025391, "train/total_loss": 0.4093626141548157 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1506035178899765, "train/contrastive_loss": 1.4524778127670288, "train/negative_loss": 1.2619547843933105, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.19052301347255707, "train/total_loss": 0.4410991072654724 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.22428585588932037, "train/contrastive_loss": 2.6999354362487793, "train/negative_loss": 1.3738682270050049, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3260670900344849, "train/total_loss": 0.764272928237915 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1076676994562149, "train/contrastive_loss": 1.0153857469558716, "train/negative_loss": 1.0031427145004272, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.012243022210896015, "train/total_loss": 0.31074485182762146 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.12680591642856598, "train/contrastive_loss": 2.765843629837036, "train/negative_loss": 1.9439961910247803, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8218474388122559, "train/total_loss": 0.6799746155738831 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.15786993503570557, "train/contrastive_loss": 2.2721447944641113, "train/negative_loss": 2.185723304748535, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.08642153441905975, "train/total_loss": 0.6122989058494568 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.22139698266983032, "train/contrastive_loss": 2.24672269821167, "train/negative_loss": 1.6440731287002563, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.602649450302124, "train/total_loss": 0.6707415580749512 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1993018537759781, "train/contrastive_loss": 3.190005302429199, "train/negative_loss": 1.3952195644378662, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.7947858572006226, "train/total_loss": 0.8373029232025146 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.23483437299728394, "train/contrastive_loss": 3.165469169616699, "train/negative_loss": 2.1562955379486084, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0091736316680908, "train/total_loss": 0.8679282069206238 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17677053809165955, "train/contrastive_loss": 1.9858793020248413, "train/negative_loss": 1.9858514070510864, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 2.789558857330121e-05, "train/total_loss": 0.5739464163780212 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17189553380012512, "train/contrastive_loss": 0.2384476512670517, "train/negative_loss": 0.22739988565444946, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.011047765612602234, "train/total_loss": 0.21958506107330322 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2899576425552368, "train/contrastive_loss": 2.3789281845092773, "train/negative_loss": 1.3426588773727417, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.036269187927246, "train/total_loss": 0.7657432556152344 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.16905038058757782, "train/contrastive_loss": 0.5521578788757324, "train/negative_loss": 0.545505702495575, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.0066522047854959965, "train/total_loss": 0.2794819474220276 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1666574478149414, "train/contrastive_loss": 1.482362985610962, "train/negative_loss": 1.4343078136444092, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.048055149614810944, "train/total_loss": 0.46313005685806274 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.16023311018943787, "train/contrastive_loss": 2.428905963897705, "train/negative_loss": 2.0511295795440674, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.37777647376060486, "train/total_loss": 0.6460143327713013 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17652864754199982, "train/contrastive_loss": 0.7080708742141724, "train/negative_loss": 0.46254757046699524, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 0.24552331864833832, "train/total_loss": 0.318142831325531 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2224830836057663, "train/contrastive_loss": 2.6854300498962402, "train/negative_loss": 1.923003911972046, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.7624260783195496, "train/total_loss": 0.7595691084861755 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2267010658979416, "train/contrastive_loss": 1.255798101425171, "train/negative_loss": 0.6936713457107544, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.5621267557144165, "train/total_loss": 0.477860689163208 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1412009447813034, "train/contrastive_loss": 2.1248886585235596, "train/negative_loss": 2.124816656112671, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 7.192782504716888e-05, "train/total_loss": 0.5661786794662476 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.20716820657253265, "train/contrastive_loss": 1.4115493297576904, "train/negative_loss": 0.539827287197113, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 0.8717220425605774, "train/total_loss": 0.48947805166244507 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.23758310079574585, "train/contrastive_loss": 2.8222498893737793, "train/negative_loss": 2.2336480617523193, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.58860182762146, "train/total_loss": 0.8020330667495728 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1892024725675583, "train/contrastive_loss": 0.7085436582565308, "train/negative_loss": 0.4332088530063629, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.27533477544784546, "train/total_loss": 0.33091121912002563 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2605579197406769, "train/contrastive_loss": 3.3863043785095215, "train/negative_loss": 1.2728831768035889, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 2.1134212017059326, "train/total_loss": 0.9378187656402588 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.13022422790527344, "train/contrastive_loss": 0.8445090055465698, "train/negative_loss": 0.6096231937408447, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.23488584160804749, "train/total_loss": 0.2991260290145874 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1745436042547226, "train/contrastive_loss": 2.0638363361358643, "train/negative_loss": 1.2187228202819824, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.8451134562492371, "train/total_loss": 0.5873108506202698 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.16936448216438293, "train/contrastive_loss": 0.8729373216629028, "train/negative_loss": 0.8728799223899841, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 5.740164124290459e-05, "train/total_loss": 0.343951940536499 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2582992613315582, "train/contrastive_loss": 0.9566442966461182, "train/negative_loss": 0.7929278612136841, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.16371645033359528, "train/total_loss": 0.4496281147003174 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.15283633768558502, "train/contrastive_loss": 0.5042253136634827, "train/negative_loss": 0.4478946626186371, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.056330662220716476, "train/total_loss": 0.25368139147758484 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.3266153931617737, "train/contrastive_loss": 1.5614755153656006, "train/negative_loss": 0.4718243479728699, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 1.089651107788086, "train/total_loss": 0.6389105319976807 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.13703817129135132, "train/contrastive_loss": 2.47029185295105, "train/negative_loss": 0.7654306292533875, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.7048611640930176, "train/total_loss": 0.6310965418815613 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.19289667904376984, "train/contrastive_loss": 3.7196288108825684, "train/negative_loss": 3.216248035430908, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.5033808946609497, "train/total_loss": 0.9368224143981934 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.26242098212242126, "train/contrastive_loss": 3.1307640075683594, "train/negative_loss": 3.130762815475464, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.0728841743912199e-06, "train/total_loss": 0.8885737657546997 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.20656751096248627, "train/contrastive_loss": 2.8097095489501953, "train/negative_loss": 1.2043330669403076, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.6053763628005981, "train/total_loss": 0.7685094475746155 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.11084030568599701, "train/contrastive_loss": 0.1763785183429718, "train/negative_loss": 0.09339582920074463, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.08298268169164658, "train/total_loss": 0.14611601829528809 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.19506914913654327, "train/contrastive_loss": 0.9072536826133728, "train/negative_loss": 0.8548882603645325, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.05236539989709854, "train/total_loss": 0.3765198886394501 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.16868776082992554, "train/contrastive_loss": 1.4061518907546997, "train/negative_loss": 1.3938604593276978, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.012291480787098408, "train/total_loss": 0.44991815090179443 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2746620178222656, "train/contrastive_loss": 2.0092341899871826, "train/negative_loss": 0.8468360900878906, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 1.162398099899292, "train/total_loss": 0.676508903503418 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.13475558161735535, "train/contrastive_loss": 1.2681504487991333, "train/negative_loss": 0.4006800353527069, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.8674704432487488, "train/total_loss": 0.38838568329811096 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.11036793142557144, "train/contrastive_loss": 0.643263578414917, "train/negative_loss": 0.6143208742141724, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.028942694887518883, "train/total_loss": 0.23902064561843872 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.14527440071105957, "train/contrastive_loss": 1.371785283088684, "train/negative_loss": 0.796165406703949, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 0.5756198763847351, "train/total_loss": 0.4196314513683319 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.19375981390476227, "train/contrastive_loss": 3.0311942100524902, "train/negative_loss": 1.077102541923523, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 1.9540917873382568, "train/total_loss": 0.7999986410140991 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.17526721954345703, "train/contrastive_loss": 1.0896062850952148, "train/negative_loss": 0.7854379415512085, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.3041682839393616, "train/total_loss": 0.3931884765625 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.09320028126239777, "train/contrastive_loss": 0.17111603915691376, "train/negative_loss": 0.1276233047246933, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.04349273815751076, "train/total_loss": 0.127423495054245 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.20182648301124573, "train/contrastive_loss": 2.5402181148529053, "train/negative_loss": 1.9559324979782104, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.58428555727005, "train/total_loss": 0.7098701000213623 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.22756846249103546, "train/contrastive_loss": 1.5960291624069214, "train/negative_loss": 1.589327335357666, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.006701822858303785, "train/total_loss": 0.5467743277549744 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.158109650015831, "train/contrastive_loss": 1.5831613540649414, "train/negative_loss": 0.9915891289710999, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.5915722846984863, "train/total_loss": 0.47474193572998047 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.18724606931209564, "train/contrastive_loss": 1.3853458166122437, "train/negative_loss": 1.1623528003692627, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.22299300134181976, "train/total_loss": 0.4643152356147766 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.15005652606487274, "train/contrastive_loss": 1.6493808031082153, "train/negative_loss": 0.41411781311035156, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.2352629899978638, "train/total_loss": 0.47993266582489014 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1380922794342041, "train/contrastive_loss": 2.0614004135131836, "train/negative_loss": 2.0613982677459717, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.1100088360981317e-06, "train/total_loss": 0.5503723621368408 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.15814632177352905, "train/contrastive_loss": 1.2941360473632812, "train/negative_loss": 0.6059972643852234, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.6881387233734131, "train/total_loss": 0.4169735312461853 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.21540136635303497, "train/contrastive_loss": 2.395094633102417, "train/negative_loss": 1.565178632736206, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8299160599708557, "train/total_loss": 0.6944202780723572 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.14196059107780457, "train/contrastive_loss": 1.3686342239379883, "train/negative_loss": 0.527056872844696, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.841577410697937, "train/total_loss": 0.4156874418258667 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.2523321211338043, "train/contrastive_loss": 2.1039605140686035, "train/negative_loss": 1.7423510551452637, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.3616095781326294, "train/total_loss": 0.6731241941452026 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.16454818844795227, "train/contrastive_loss": 0.9493318200111389, "train/negative_loss": 0.9492660760879517, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 6.573570135515183e-05, "train/total_loss": 0.35441455245018005 }, { "epoch": 11.619718309859154, "eval_exact_match_accuracy": 0.31922398589065254, "eval_hamming_loss": 0.06608569353667393, "eval_loss": 0.5369996428489685, "eval_macro_f1": 0.4060723084250586, "eval_macro_precision": 0.6174204117921679, "eval_macro_recall": 0.33369223478544824, "eval_micro_f1": 0.5744822979291917, "eval_micro_precision": 0.7692307692307693, "eval_micro_recall": 0.4584221748400853, "eval_runtime": 2.8475, "eval_samples_per_second": 199.122, "eval_steps_per_second": 24.934, "step": 3300 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.1033724844455719, "train/contrastive_loss": 0.595157265663147, "train/negative_loss": 0.4263073801994324, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.168849915266037, "train/total_loss": 0.22240394353866577 }, { "epoch": 11.619718309859154, "step": 3300, "train/classification_loss": 0.09682909399271011, "train/contrastive_loss": 0.8690621256828308, "train/negative_loss": 0.8294048309326172, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.039657287299633026, "train/total_loss": 0.2706415355205536 }, { "epoch": 11.795774647887324, "grad_norm": 4.02087926864624, "learning_rate": 1.954249471458774e-05, "loss": 0.5413, "step": 3350 }, { "epoch": 11.795774647887324, "step": 3350, "train/classification_loss": 0.16480125486850739, "train/contrastive_loss": 0.21811242401599884, "train/negative_loss": 0.2180793583393097, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 3.306148573756218e-05, "train/total_loss": 0.20842373371124268 }, { "epoch": 11.795774647887324, "step": 3350, "train/classification_loss": 0.13820725679397583, "train/contrastive_loss": 1.0499615669250488, "train/negative_loss": 0.48286932706832886, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.56709223985672, "train/total_loss": 0.3481995761394501 }, { "epoch": 11.971830985915492, "grad_norm": 16.348533630371094, "learning_rate": 1.9535447498238198e-05, "loss": 0.5809, "step": 3400 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.2864153981208801, "train/contrastive_loss": 2.5060911178588867, "train/negative_loss": 1.3167080879211426, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.1893829107284546, "train/total_loss": 0.7876336574554443 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.2402697503566742, "train/contrastive_loss": 1.610914707183838, "train/negative_loss": 0.41657015681266785, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 1.1943445205688477, "train/total_loss": 0.5624526739120483 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.22807277739048004, "train/contrastive_loss": 1.9831628799438477, "train/negative_loss": 1.0569273233413696, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9262354969978333, "train/total_loss": 0.6247053742408752 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.17550817131996155, "train/contrastive_loss": 2.4060754776000977, "train/negative_loss": 1.3238279819488525, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.0822473764419556, "train/total_loss": 0.6567232608795166 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.22617276012897491, "train/contrastive_loss": 2.8114664554595947, "train/negative_loss": 2.1197962760925293, "train/num_negatives": 34, "train/num_positives": 18, "train/positive_loss": 0.6916702389717102, "train/total_loss": 0.7884660363197327 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.22991156578063965, "train/contrastive_loss": 3.29605770111084, "train/negative_loss": 1.4074801206588745, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.8885774612426758, "train/total_loss": 0.8891231417655945 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.18757151067256927, "train/contrastive_loss": 1.8799256086349487, "train/negative_loss": 0.8823308944702148, "train/num_negatives": 36, "train/num_positives": 14, "train/positive_loss": 0.9975947141647339, "train/total_loss": 0.5635566115379333 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.17693592607975006, "train/contrastive_loss": 0.7002310156822205, "train/negative_loss": 0.7000147104263306, "train/num_negatives": 50, "train/num_positives": 2, "train/positive_loss": 0.0002163286553695798, "train/total_loss": 0.3169821500778198 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.10390909016132355, "train/contrastive_loss": 0.9423516988754272, "train/negative_loss": 0.6986709237098694, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.24368074536323547, "train/total_loss": 0.2923794388771057 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.16324786841869354, "train/contrastive_loss": 2.3501038551330566, "train/negative_loss": 1.442505121231079, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.9075987935066223, "train/total_loss": 0.6332686543464661 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.12983526289463043, "train/contrastive_loss": 1.7823537588119507, "train/negative_loss": 0.28791674971580505, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 1.4944369792938232, "train/total_loss": 0.48630601167678833 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1586899310350418, "train/contrastive_loss": 2.7673845291137695, "train/negative_loss": 1.4687200784683228, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 1.2986645698547363, "train/total_loss": 0.7121668457984924 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1976153403520584, "train/contrastive_loss": 2.9747040271759033, "train/negative_loss": 1.6252983808517456, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.3494056463241577, "train/total_loss": 0.7925561666488647 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.15510419011116028, "train/contrastive_loss": 1.403907060623169, "train/negative_loss": 0.6084649562835693, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.7954421043395996, "train/total_loss": 0.43588560819625854 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.14470325410366058, "train/contrastive_loss": 2.6630091667175293, "train/negative_loss": 0.42742475867271423, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 2.2355844974517822, "train/total_loss": 0.6773051023483276 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.161673441529274, "train/contrastive_loss": 1.0393285751342773, "train/negative_loss": 0.5355088710784912, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.5038197040557861, "train/total_loss": 0.36953914165496826 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.10991991311311722, "train/contrastive_loss": 1.0561574697494507, "train/negative_loss": 0.1740603744983673, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.882097065448761, "train/total_loss": 0.32115140557289124 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.17279328405857086, "train/contrastive_loss": 1.3032574653625488, "train/negative_loss": 0.4021962881088257, "train/num_negatives": 26, "train/num_positives": 20, "train/positive_loss": 0.9010611772537231, "train/total_loss": 0.4334447979927063 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.15077152848243713, "train/contrastive_loss": 1.6674673557281494, "train/negative_loss": 0.7585099935531616, "train/num_negatives": 42, "train/num_positives": 10, "train/positive_loss": 0.9089574217796326, "train/total_loss": 0.484264999628067 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.21579018235206604, "train/contrastive_loss": 3.4853367805480957, "train/negative_loss": 1.4509748220443726, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 2.0343618392944336, "train/total_loss": 0.9128575325012207 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.11221495270729065, "train/contrastive_loss": 1.077101230621338, "train/negative_loss": 1.0760865211486816, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.0010147526627406478, "train/total_loss": 0.3276351988315582 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.12250817567110062, "train/contrastive_loss": 2.709306478500366, "train/negative_loss": 1.8837618827819824, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.8255445957183838, "train/total_loss": 0.6643694639205933 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.16665510833263397, "train/contrastive_loss": 2.5002269744873047, "train/negative_loss": 2.378385066986084, "train/num_negatives": 46, "train/num_positives": 6, "train/positive_loss": 0.1218419224023819, "train/total_loss": 0.666700541973114 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.23845462501049042, "train/contrastive_loss": 2.1372268199920654, "train/negative_loss": 1.0707604885101318, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.0664663314819336, "train/total_loss": 0.6658999919891357 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.18439550697803497, "train/contrastive_loss": 3.084998607635498, "train/negative_loss": 1.116882562637329, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 1.9681161642074585, "train/total_loss": 0.8013952374458313 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.22670240700244904, "train/contrastive_loss": 2.1536686420440674, "train/negative_loss": 1.2204763889312744, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.9331921935081482, "train/total_loss": 0.6574361324310303 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1767055243253708, "train/contrastive_loss": 1.5982882976531982, "train/negative_loss": 1.594626545906067, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 0.0036618048325181007, "train/total_loss": 0.49636316299438477 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1886516511440277, "train/contrastive_loss": 0.33055827021598816, "train/negative_loss": 0.24170003831386566, "train/num_negatives": 32, "train/num_positives": 20, "train/positive_loss": 0.0888582244515419, "train/total_loss": 0.25476330518722534 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.2767840027809143, "train/contrastive_loss": 2.9796955585479736, "train/negative_loss": 1.500819206237793, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 1.4788763523101807, "train/total_loss": 0.8727231025695801 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1781867891550064, "train/contrastive_loss": 0.8134265542030334, "train/negative_loss": 0.7134259939193726, "train/num_negatives": 38, "train/num_positives": 10, "train/positive_loss": 0.1000005379319191, "train/total_loss": 0.3408721089363098 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.15018221735954285, "train/contrastive_loss": 0.8663634657859802, "train/negative_loss": 0.7129050493240356, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 0.1534584015607834, "train/total_loss": 0.32345491647720337 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.14743544161319733, "train/contrastive_loss": 2.3652307987213135, "train/negative_loss": 1.2357358932495117, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.1294949054718018, "train/total_loss": 0.6204816102981567 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1907016783952713, "train/contrastive_loss": 2.2304954528808594, "train/negative_loss": 1.0534167289733887, "train/num_negatives": 42, "train/num_positives": 12, "train/positive_loss": 1.1770786046981812, "train/total_loss": 0.6368007659912109 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.22363734245300293, "train/contrastive_loss": 2.555762767791748, "train/negative_loss": 1.7651923894882202, "train/num_negatives": 48, "train/num_positives": 6, "train/positive_loss": 0.7905704379081726, "train/total_loss": 0.7347899079322815 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.21107934415340424, "train/contrastive_loss": 1.508976697921753, "train/negative_loss": 0.9622426629066467, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.546734094619751, "train/total_loss": 0.5128746628761292 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1506933569908142, "train/contrastive_loss": 2.156078815460205, "train/negative_loss": 2.156059503555298, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.9261493434896693e-05, "train/total_loss": 0.5819091200828552 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.19637171924114227, "train/contrastive_loss": 1.519548773765564, "train/negative_loss": 0.29067566990852356, "train/num_negatives": 46, "train/num_positives": 8, "train/positive_loss": 1.2288731336593628, "train/total_loss": 0.5002814531326294 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.24347355961799622, "train/contrastive_loss": 2.788450002670288, "train/negative_loss": 2.3680341243743896, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.42041581869125366, "train/total_loss": 0.8011635541915894 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.20849721133708954, "train/contrastive_loss": 0.7086260318756104, "train/negative_loss": 0.34195905923843384, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 0.3666669428348541, "train/total_loss": 0.3502224087715149 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.28504258394241333, "train/contrastive_loss": 3.280843734741211, "train/negative_loss": 1.3918296098709106, "train/num_negatives": 42, "train/num_positives": 8, "train/positive_loss": 1.8890140056610107, "train/total_loss": 0.9412113428115845 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.12758541107177734, "train/contrastive_loss": 0.9434974193572998, "train/negative_loss": 0.6942369341850281, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.24926047027111053, "train/total_loss": 0.3162848949432373 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.18063253164291382, "train/contrastive_loss": 2.559826374053955, "train/negative_loss": 1.1091228723526, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 1.450703501701355, "train/total_loss": 0.6925978064537048 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.14654940366744995, "train/contrastive_loss": 0.37958288192749023, "train/negative_loss": 0.3795297145843506, "train/num_negatives": 50, "train/num_positives": 4, "train/positive_loss": 5.3169023885857314e-05, "train/total_loss": 0.22246599197387695 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.2653622329235077, "train/contrastive_loss": 0.40057963132858276, "train/negative_loss": 0.3929031789302826, "train/num_negatives": 50, "train/num_positives": 6, "train/positive_loss": 0.0076764412224292755, "train/total_loss": 0.3454781770706177 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.15090252459049225, "train/contrastive_loss": 0.6711095571517944, "train/negative_loss": 0.5360282063484192, "train/num_negatives": 40, "train/num_positives": 12, "train/positive_loss": 0.13508135080337524, "train/total_loss": 0.28512442111968994 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.3246062099933624, "train/contrastive_loss": 2.254579782485962, "train/negative_loss": 1.4058345556259155, "train/num_negatives": 30, "train/num_positives": 18, "train/positive_loss": 0.8487451672554016, "train/total_loss": 0.7755221724510193 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1271226704120636, "train/contrastive_loss": 2.638763427734375, "train/negative_loss": 0.6320816874504089, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 2.0066816806793213, "train/total_loss": 0.6548753976821899 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.18041278421878815, "train/contrastive_loss": 2.6744189262390137, "train/negative_loss": 2.264373302459717, "train/num_negatives": 42, "train/num_positives": 14, "train/positive_loss": 0.4100455641746521, "train/total_loss": 0.7152965664863586 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.300018310546875, "train/contrastive_loss": 2.5565543174743652, "train/negative_loss": 2.5565528869628906, "train/num_negatives": 48, "train/num_positives": 2, "train/positive_loss": 1.3113030945532955e-06, "train/total_loss": 0.811329185962677 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.2101355493068695, "train/contrastive_loss": 3.068310260772705, "train/negative_loss": 1.3865567445755005, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 1.681753396987915, "train/total_loss": 0.8237975835800171 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.12214487046003342, "train/contrastive_loss": 0.7940738797187805, "train/negative_loss": 0.2134452909231186, "train/num_negatives": 36, "train/num_positives": 12, "train/positive_loss": 0.5806285738945007, "train/total_loss": 0.2809596359729767 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.21674410998821259, "train/contrastive_loss": 0.9268835186958313, "train/negative_loss": 0.6917107701301575, "train/num_negatives": 40, "train/num_positives": 8, "train/positive_loss": 0.23517273366451263, "train/total_loss": 0.40212082862854004 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.17498879134655, "train/contrastive_loss": 1.4075732231140137, "train/negative_loss": 1.0333727598190308, "train/num_negatives": 38, "train/num_positives": 14, "train/positive_loss": 0.37420040369033813, "train/total_loss": 0.4565034508705139 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.32710063457489014, "train/contrastive_loss": 3.023778200149536, "train/negative_loss": 0.9421355128288269, "train/num_negatives": 36, "train/num_positives": 6, "train/positive_loss": 2.0816426277160645, "train/total_loss": 0.9318562746047974 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.13638830184936523, "train/contrastive_loss": 0.8297756910324097, "train/negative_loss": 0.26942458748817444, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 0.5603510737419128, "train/total_loss": 0.3023434281349182 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.12461970746517181, "train/contrastive_loss": 0.5863827466964722, "train/negative_loss": 0.35135072469711304, "train/num_negatives": 34, "train/num_positives": 22, "train/positive_loss": 0.23503205180168152, "train/total_loss": 0.24189625680446625 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1512128710746765, "train/contrastive_loss": 2.0193936824798584, "train/negative_loss": 0.9081525206565857, "train/num_negatives": 52, "train/num_positives": 4, "train/positive_loss": 1.111241102218628, "train/total_loss": 0.5550916194915771 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.20463521778583527, "train/contrastive_loss": 2.241032123565674, "train/negative_loss": 1.4335198402404785, "train/num_negatives": 46, "train/num_positives": 4, "train/positive_loss": 0.8075124025344849, "train/total_loss": 0.6528416275978088 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.19932608306407928, "train/contrastive_loss": 1.1772005558013916, "train/negative_loss": 0.46148422360420227, "train/num_negatives": 38, "train/num_positives": 12, "train/positive_loss": 0.7157163619995117, "train/total_loss": 0.4347662031650543 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.07740391045808792, "train/contrastive_loss": 0.21475635468959808, "train/negative_loss": 0.18394051492214203, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.030815843492746353, "train/total_loss": 0.12035518139600754 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.20169365406036377, "train/contrastive_loss": 2.285486936569214, "train/negative_loss": 1.5728172063827515, "train/num_negatives": 40, "train/num_positives": 10, "train/positive_loss": 0.7126697897911072, "train/total_loss": 0.6587910652160645 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.20289531350135803, "train/contrastive_loss": 1.0738251209259033, "train/negative_loss": 1.0522583723068237, "train/num_negatives": 46, "train/num_positives": 2, "train/positive_loss": 0.021566739305853844, "train/total_loss": 0.41766035556793213 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.16088584065437317, "train/contrastive_loss": 2.5070641040802, "train/negative_loss": 1.0180082321166992, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.489055871963501, "train/total_loss": 0.6622986793518066 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.18439029157161713, "train/contrastive_loss": 1.3094674348831177, "train/negative_loss": 0.7377079129219055, "train/num_negatives": 40, "train/num_positives": 16, "train/positive_loss": 0.5717595219612122, "train/total_loss": 0.446283757686615 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.171571284532547, "train/contrastive_loss": 2.0250818729400635, "train/negative_loss": 0.44625118374824524, "train/num_negatives": 44, "train/num_positives": 8, "train/positive_loss": 1.578830599784851, "train/total_loss": 0.5765876770019531 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.12282082438468933, "train/contrastive_loss": 0.7972508072853088, "train/negative_loss": 0.7972486615180969, "train/num_negatives": 34, "train/num_positives": 20, "train/positive_loss": 2.1338505575840827e-06, "train/total_loss": 0.28227096796035767 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.16165323555469513, "train/contrastive_loss": 1.1839613914489746, "train/negative_loss": 0.4316282272338867, "train/num_negatives": 46, "train/num_positives": 10, "train/positive_loss": 0.7523331046104431, "train/total_loss": 0.3984455168247223 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.20239406824111938, "train/contrastive_loss": 2.348005533218384, "train/negative_loss": 1.31099534034729, "train/num_negatives": 48, "train/num_positives": 8, "train/positive_loss": 1.0370101928710938, "train/total_loss": 0.6719951629638672 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.16138069331645966, "train/contrastive_loss": 2.599496841430664, "train/negative_loss": 1.0955849885940552, "train/num_negatives": 44, "train/num_positives": 12, "train/positive_loss": 1.5039119720458984, "train/total_loss": 0.6812800765037537 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.2602480351924896, "train/contrastive_loss": 1.3008562326431274, "train/negative_loss": 0.9205397367477417, "train/num_negatives": 44, "train/num_positives": 6, "train/positive_loss": 0.38031646609306335, "train/total_loss": 0.5204192996025085 }, { "epoch": 11.971830985915492, "step": 3400, "train/classification_loss": 0.1769106090068817, "train/contrastive_loss": 0.6750936508178711, "train/negative_loss": 0.6715583801269531, "train/num_negatives": 32, "train/num_positives": 8, "train/positive_loss": 0.00353529816493392, "train/total_loss": 0.3119293451309204 }, { "epoch": 11.971830985915492, "eval_exact_match_accuracy": 0.31746031746031744, "eval_hamming_loss": 0.0665006743438116, "eval_loss": 0.5517120361328125, "eval_macro_f1": 0.4510166791146767, "eval_macro_precision": 0.6677478588667094, "eval_macro_recall": 0.3737002146225135, "eval_micro_f1": 0.5706630944407234, "eval_micro_precision": 0.7675675675675676, "eval_micro_recall": 0.4541577825159915, "eval_runtime": 2.8549, "eval_samples_per_second": 198.606, "eval_steps_per_second": 24.869, "step": 3400 }, { "epoch": 11.971830985915492, "step": 3400, "total_flos": 0.0, "train_loss": 0.9307791737949147, "train_runtime": 983.1644, "train_samples_per_second": 2307.854, "train_steps_per_second": 144.432 } ], "logging_steps": 50, "max_steps": 142000, "num_input_tokens_seen": 0, "num_train_epochs": 500, "save_steps": 2000, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 5, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }