Saving weights and logs of step 10000

Files changed (3) hide show

events.out.tfevents.1642492715.t1v-n-e1a08808-w-0.1951911.0.v2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b20363f7e352b84ee407aa02c64a00386a9d87f87d6cc568e79718c957b0f7c7
+size 1470136

flax_model.msgpack CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31e38a8e41f06efe2d65f49514bd7f9aebf78a271aae60752027cba7177e43b8
+oid sha256:471773a4c40956dc70a98b851522d92b8e06775b2c48aae8056a20ac9de4de07
 size 498796983

run_step3.sh CHANGED Viewed

@@ -12,8 +12,8 @@
     --per_device_train_batch_size="192" \
     --per_device_eval_batch_size="192" \
     --learning_rate="4e-4" \
-    --end_learning_rate="2e-4" \
-    --warmup_steps="0" \
+    --end_learning_rate="1e-4" \
+    --warmup_steps="10000" \
     --overwrite_output_dir \
     --num_train_epochs="1" \
     --adam_beta1="0.9" \