radic2682 committed on
Commit
2c0376c
·
verified ·
1 Parent(s): 1c98682

Training in progress, step 5000

Browse files
config.json CHANGED
@@ -3,7 +3,7 @@
3
  "architectures": [
4
  "BigBirdForQuestionAnswering"
5
  ],
6
- "attention_probs_dropout_prob": 0.3,
7
  "attention_type": "block_sparse",
8
  "block_size": 16,
9
  "bos_token_id": 1,
 
3
  "architectures": [
4
  "BigBirdForQuestionAnswering"
5
  ],
6
+ "attention_probs_dropout_prob": 0.1,
7
  "attention_type": "block_sparse",
8
  "block_size": 16,
9
  "bos_token_id": 1,
eval_nbest_predictions.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96cb0d3293d11d08f52308b9eb1dd5cda66f504f040755b86744568624262701
3
- size 46247000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:247c7ecdd25ffafd745715b99e4b060789ea645d6deb6951094f68c9dd8943ae
3
+ size 45803384
eval_predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d0f04062b372dd2b54b7aa5b94f5ff75d9310ac875a43455e8625f78d019981
3
  size 1465632968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b76c675eb8386ae59af895a6d0c2f5a0c0a2f81b49f6d73e59507ea258b64c5e
3
  size 1465632968
runs/events.out.tfevents.1723780259.isl-gpu4.2545635.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50d3009ee4ab44c43e3dffc57eb8463fd3e0b6e6b1f196ba9e9739996bcb5aa6
3
- size 27091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f32ece778a06e24196937c21a622e71499ae31f825c8ca2b76623400d30c864
3
+ size 37754
runs/events.out.tfevents.1723800445.isl-gpu4.2837113.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83de2e76bf26f7c6b512483103dd2af2139ad87318ce3ce289ae0373ac2514af
3
+ size 27093
runs/events.out.tfevents.1723800445.isl-gpu4.2837114.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13f861b07b6ca95e3db6add6a657cc612b9e4f6a50beb57e2b06e8eeecb9f5df
3
+ size 88
tokenizer.json CHANGED
@@ -1,21 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 4096,
6
- "strategy": "OnlySecond",
7
- "stride": 128
8
- },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 4096
12
- },
13
- "direction": "Right",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 0,
16
- "pad_type_id": 0,
17
- "pad_token": "<pad>"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:541cb5eff113a830e24236aebf7b94d2b933afd215e37928b0e8e1975f77d03a
3
  size 4911
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6752ee353cbae13420becfe4db048b3fe11da7af83b5a24eea502e62b9a8d2ec
3
  size 4911