Training in progress, step 5000

Files changed (9) hide show

config.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "architectures": [
     "BigBirdForQuestionAnswering"
   ],
-  "attention_probs_dropout_prob": 0.3,
   "attention_type": "block_sparse",
   "block_size": 16,
   "bos_token_id": 1,

   "architectures": [
     "BigBirdForQuestionAnswering"
   ],
+  "attention_probs_dropout_prob": 0.1,
   "attention_type": "block_sparse",
   "block_size": 16,
   "bos_token_id": 1,

eval_nbest_predictions.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96cb0d3293d11d08f52308b9eb1dd5cda66f504f040755b86744568624262701
-size 46247000

 version https://git-lfs.github.com/spec/v1
+oid sha256:247c7ecdd25ffafd745715b99e4b060789ea645d6deb6951094f68c9dd8943ae
+size 45803384

eval_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5d0f04062b372dd2b54b7aa5b94f5ff75d9310ac875a43455e8625f78d019981
 size 1465632968

 version https://git-lfs.github.com/spec/v1
+oid sha256:b76c675eb8386ae59af895a6d0c2f5a0c0a2f81b49f6d73e59507ea258b64c5e
 size 1465632968

runs/events.out.tfevents.1723780259.isl-gpu4.2545635.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50d3009ee4ab44c43e3dffc57eb8463fd3e0b6e6b1f196ba9e9739996bcb5aa6
-size 27091

 version https://git-lfs.github.com/spec/v1
+oid sha256:9f32ece778a06e24196937c21a622e71499ae31f825c8ca2b76623400d30c864
+size 37754

runs/events.out.tfevents.1723800445.isl-gpu4.2837113.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:83de2e76bf26f7c6b512483103dd2af2139ad87318ce3ce289ae0373ac2514af
+size 27093

runs/events.out.tfevents.1723800445.isl-gpu4.2837114.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:13f861b07b6ca95e3db6add6a657cc612b9e4f6a50beb57e2b06e8eeecb9f5df
+size 88

tokenizer.json CHANGED Viewed

@@ -1,21 +1,7 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 4096,
-    "strategy": "OnlySecond",
-    "stride": 128
-  },
-  "padding": {
-    "strategy": {
-      "Fixed": 4096
-    },
-    "direction": "Right",
-    "pad_to_multiple_of": null,
-    "pad_id": 0,
-    "pad_type_id": 0,
-    "pad_token": "<pad>"
-  },
   "added_tokens": [
     {
       "id": 0,

 {
   "version": "1.0",
+  "truncation": null,
+  "padding": null,
   "added_tokens": [
     {
       "id": 0,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:541cb5eff113a830e24236aebf7b94d2b933afd215e37928b0e8e1975f77d03a
 size 4911

 version https://git-lfs.github.com/spec/v1
+oid sha256:6752ee353cbae13420becfe4db048b3fe11da7af83b5a24eea502e62b9a8d2ec
 size 4911