Training in progress, step 250

Files changed (5) hide show

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:15ab6d53f86a358ee5df321f4b7a089a1640a875f053cda5bfe5c041e0b9f108
 size 18915328

 version https://git-lfs.github.com/spec/v1
+oid sha256:a378b6eb3ef94fe5e0fe0232b088bc46401b578c8996d011311fa144e77ab67b
 size 18915328

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-    "epoch": 5.0,
-    "total_flos": 12502279618560.0,
-    "train_loss": 1.1522993087768554,
-    "train_runtime": 5.217,
-    "train_samples_per_second": 3.834,
-    "train_steps_per_second": 0.958
 }

 {
+    "epoch": 10.0,
+    "total_flos": 122531399884800.0,
+    "train_loss": 0.3025847053527832,
+    "train_runtime": 63.1156,
+    "train_samples_per_second": 3.169,
+    "train_steps_per_second": 3.169
 }

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-    "epoch": 5.0,
-    "total_flos": 12502279618560.0,
-    "train_loss": 1.1522993087768554,
-    "train_runtime": 5.217,
-    "train_samples_per_second": 3.834,
-    "train_steps_per_second": 0.958
 }

 {
+    "epoch": 10.0,
+    "total_flos": 122531399884800.0,
+    "train_loss": 0.3025847053527832,
+    "train_runtime": 63.1156,
+    "train_samples_per_second": 3.169,
+    "train_steps_per_second": 3.169
 }

trainer_state.json CHANGED Viewed

@@ -1,27 +1,27 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 5.0,
   "eval_steps": 500,
-  "global_step": 5,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 5.0,
-      "step": 5,
-      "total_flos": 12502279618560.0,
-      "train_loss": 1.1522993087768554,
-      "train_runtime": 5.217,
-      "train_samples_per_second": 3.834,
-      "train_steps_per_second": 0.958
     }
   ],
   "logging_steps": 500,
-  "max_steps": 5,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 5,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -35,8 +35,8 @@
       "attributes": {}
     }
   },
-  "total_flos": 12502279618560.0,
-  "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 10.0,
   "eval_steps": 500,
+  "global_step": 200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 10.0,
+      "step": 200,
+      "total_flos": 122531399884800.0,
+      "train_loss": 0.3025847053527832,
+      "train_runtime": 63.1156,
+      "train_samples_per_second": 3.169,
+      "train_steps_per_second": 3.169
     }
   ],
   "logging_steps": 500,
+  "max_steps": 200,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
   "save_steps": 500,
   "stateful_callbacks": {
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 122531399884800.0,
+  "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:78217b65b5bd4d0c9c0f663c5b1d78d9e274c81fdd94f8fbd0ad858ed500c640
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:d3f1cbe973f169051d1c78945511b0e6eb73a6057cd99ce7bd3c87275d1a4d80
 size 5496