Training in progress, step 500

Files changed (7) hide show

all_results.json CHANGED Viewed

@@ -1,5 +1,17 @@
 {
     "epoch": 5.0,
     "total_flos": 0.0,
     "train_loss": 1.6828109741210937,
     "train_runtime": 29.5351,

 {
     "epoch": 5.0,
+    "eval_exact_match_accuracy": 0.2,
+    "eval_hamming_loss": 0.075,
+    "eval_loss": 0.8420153856277466,
+    "eval_macro_f1": 0.09192664920219099,
+    "eval_macro_precision": 0.09243697478991597,
+    "eval_macro_recall": 0.09215686274509804,
+    "eval_micro_f1": 0.4,
+    "eval_micro_precision": 0.6071428571428571,
+    "eval_micro_recall": 0.2982456140350877,
+    "eval_runtime": 0.2221,
+    "eval_samples_per_second": 180.125,
+    "eval_steps_per_second": 13.509,
     "total_flos": 0.0,
     "train_loss": 1.6828109741210937,
     "train_runtime": 29.5351,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b28070514a109f4c6d0cc6bd89ef87ea76348c26aa37d820b2eae9f6195c9738
 size 441154988

 version https://git-lfs.github.com/spec/v1
+oid sha256:2d090d5e2966f2091768ffc79be690bc37433eae61a697aae158a43c8f2c1826
 size 441154988

runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947964.92b2e0e6fb20.2194.7 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:57c3147ab3f0cf9d900aafcf566f061e709215d31fd0c96edc7852d2af79588d
+size 3776

runs/Jun15_00-40-18_92b2e0e6fb20/events.out.tfevents.1749948019.92b2e0e6fb20.2194.8 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a88e4afb6c8a434d92c19def97557910319f634b24c709e67acb9de318f8594f
+size 22648

test_results.json ADDED Viewed

+{
+    "epoch": 5.0,
+    "eval_exact_match_accuracy": 0.2,
+    "eval_hamming_loss": 0.075,
+    "eval_loss": 0.8420153856277466,
+    "eval_macro_f1": 0.09192664920219099,
+    "eval_macro_precision": 0.09243697478991597,
+    "eval_macro_recall": 0.09215686274509804,
+    "eval_micro_f1": 0.4,
+    "eval_micro_precision": 0.6071428571428571,
+    "eval_micro_recall": 0.2982456140350877,
+    "eval_runtime": 0.2221,
+    "eval_samples_per_second": 180.125,
+    "eval_steps_per_second": 13.509
+}

trainer_state.json CHANGED Viewed

@@ -12,40 +12,40 @@
     {
       "epoch": 0,
       "step": 0,
-      "train/classification_loss": 0.6832770109176636,
-      "train/contrastive_loss": 7.157876014709473,
-      "train/negative_loss": 7.157375812530518,
       "train/num_negatives": 190,
       "train/num_positives": 50,
-      "train/positive_loss": 0.0005001117824576795,
-      "train/total_loss": 2.1148521900177
     },
     {
       "epoch": 0,
       "step": 0,
-      "train/classification_loss": 0.691846489906311,
-      "train/contrastive_loss": 6.978695392608643,
-      "train/negative_loss": 6.977847576141357,
       "train/num_negatives": 192,
       "train/num_positives": 48,
-      "train/positive_loss": 0.0008476818911731243,
-      "train/total_loss": 2.08758544921875
     },
     {
       "epoch": 5.0,
-      "grad_norm": 9.853194236755371,
       "learning_rate": 9.800000000000001e-06,
-      "loss": 2.9901,
       "step": 50
     },
     {
       "epoch": 5.0,
       "step": 50,
       "total_flos": 0.0,
-      "train_loss": 2.9900537109375,
-      "train_runtime": 27.9302,
-      "train_samples_per_second": 56.57,
-      "train_steps_per_second": 1.79
     }
   ],
   "logging_steps": 50,

     {
       "epoch": 0,
       "step": 0,
+      "train/classification_loss": 0.6251798272132874,
+      "train/contrastive_loss": 1.386080265045166,
+      "train/negative_loss": 1.1070373058319092,
       "train/num_negatives": 190,
       "train/num_positives": 50,
+      "train/positive_loss": 0.27904292941093445,
+      "train/total_loss": 0.9023958444595337
     },
     {
       "epoch": 0,
       "step": 0,
+      "train/classification_loss": 0.6276130080223083,
+      "train/contrastive_loss": 1.6681630611419678,
+      "train/negative_loss": 1.269258737564087,
       "train/num_negatives": 192,
       "train/num_positives": 48,
+      "train/positive_loss": 0.39890438318252563,
+      "train/total_loss": 0.9612456560134888
     },
     {
       "epoch": 5.0,
+      "grad_norm": 10.065888404846191,
       "learning_rate": 9.800000000000001e-06,
+      "loss": 1.6828,
       "step": 50
     },
     {
       "epoch": 5.0,
       "step": 50,
       "total_flos": 0.0,
+      "train_loss": 1.6828109741210937,
+      "train_runtime": 29.5351,
+      "train_samples_per_second": 53.496,
+      "train_steps_per_second": 1.693
     }
   ],
   "logging_steps": 50,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c02a3dbfbd9db3f1e4a919c78948efb8eb944344dc26585f19fc5dded995095b
 size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:03e2d330b9dd8fe925b85bea0db478c22579b7da080ec4cac0c4183a4c7358e0
 size 5368