wangyichen25 commited on
Commit
26dc7f7
·
verified ·
1 Parent(s): 8909a9a

Training in progress, step 20, checkpoint

Browse files
checkpoint-20/adapter_config.json CHANGED
@@ -28,16 +28,16 @@
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
- "o_proj",
32
- "k_proj",
33
- "gate_proj",
34
  "fc1",
 
 
 
35
  "q_proj",
36
- "v_proj",
37
  "up_proj",
38
  "down_proj",
39
- "out_proj",
40
- "fc2"
41
  ],
42
  "task_type": "CAUSAL_LM",
43
  "trainable_token_indices": null,
 
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
 
 
 
31
  "fc1",
32
+ "o_proj",
33
+ "fc2",
34
+ "out_proj",
35
  "q_proj",
36
+ "gate_proj",
37
  "up_proj",
38
  "down_proj",
39
+ "v_proj",
40
+ "k_proj"
41
  ],
42
  "task_type": "CAUSAL_LM",
43
  "trainable_token_indices": null,
checkpoint-20/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e3cb107c01a3c7342a51f5cc8e1090b035ba2a13268420756a95f0d6114f559
3
  size 2839126480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdda4478dbd5bd2e9d6fd020c8f89c04cf43e9c7cb839ca8e27ec76a4814e478
3
  size 2839126480
checkpoint-20/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:505d1a7a195c72587d286c26793412f1e849b8018ee6d531b15e3ed2b296593e
3
  size 5678690152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3351616e75477416da57bccd262ac5d6967d67143486d25c6ba87cc889a3b844
3
  size 5678690152
checkpoint-20/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a7c19685927162de419f962184a4ce06ccfb2a3441588f0dc66e1e7594957f3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:142e5c3a83ea588f932553c5bde7b70bfd98ed130ade922e3cb2e56b069aacf3
3
  size 14244
checkpoint-20/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46f456ef683d11200f96f387b8eee25e5e55fcabcb7dc642edf15ecd17d4d595
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b8a7fc5388dd8f77109db1fef12582ae17574ccfc9b9d15825551c90221061
3
  size 1064
checkpoint-20/trainer_state.json CHANGED
@@ -3,36 +3,55 @@
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
  "epoch": 0.38461538461538464,
6
- "eval_steps": 20,
7
  "global_step": 20,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  {
13
  "epoch": 0.38461538461538464,
14
- "grad_norm": 2.9819071292877197,
15
- "learning_rate": 0.00017,
16
- "loss": 2.4045,
17
- "mean_token_accuracy": 0.9366250112652779,
18
  "num_tokens": 98240.0,
19
  "step": 20
20
  },
21
  {
22
  "epoch": 0.38461538461538464,
23
- "eval_loss": 0.04179316386580467,
24
- "eval_mean_token_accuracy": 0.9780769439843985,
25
  "eval_num_tokens": 98240.0,
26
- "eval_runtime": 17.9013,
27
- "eval_samples_per_second": 2.793,
28
- "eval_steps_per_second": 0.726,
29
  "step": 20
30
  }
31
  ],
32
- "logging_steps": 20,
33
- "max_steps": 104,
34
  "num_input_tokens_seen": 0,
35
- "num_train_epochs": 2,
36
  "save_steps": 20,
37
  "stateful_callbacks": {
38
  "TrainerControl": {
 
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
  "epoch": 0.38461538461538464,
6
+ "eval_steps": 10,
7
  "global_step": 20,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
+ {
13
+ "epoch": 0.19230769230769232,
14
+ "grad_norm": 21.498493194580078,
15
+ "learning_rate": 0.00019470198675496689,
16
+ "loss": 14.4551,
17
+ "mean_token_accuracy": 0.6612499989569187,
18
+ "num_tokens": 49120.0,
19
+ "step": 10
20
+ },
21
+ {
22
+ "epoch": 0.19230769230769232,
23
+ "eval_loss": 1.0248602628707886,
24
+ "eval_mean_token_accuracy": 0.8969230560156015,
25
+ "eval_num_tokens": 49120.0,
26
+ "eval_runtime": 17.9265,
27
+ "eval_samples_per_second": 2.789,
28
+ "eval_steps_per_second": 0.725,
29
+ "step": 10
30
+ },
31
  {
32
  "epoch": 0.38461538461538464,
33
+ "grad_norm": 6.777862071990967,
34
+ "learning_rate": 0.00018145695364238411,
35
+ "loss": 2.185,
36
+ "mean_token_accuracy": 0.9445000052452087,
37
  "num_tokens": 98240.0,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 0.38461538461538464,
42
+ "eval_loss": 0.13720029592514038,
43
+ "eval_mean_token_accuracy": 0.9761538688953106,
44
  "eval_num_tokens": 98240.0,
45
+ "eval_runtime": 17.8731,
46
+ "eval_samples_per_second": 2.797,
47
+ "eval_steps_per_second": 0.727,
48
  "step": 20
49
  }
50
  ],
51
+ "logging_steps": 10,
52
+ "max_steps": 156,
53
  "num_input_tokens_seen": 0,
54
+ "num_train_epochs": 3,
55
  "save_steps": 20,
56
  "stateful_callbacks": {
57
  "TrainerControl": {
checkpoint-20/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2661e9d16a322a8b69865bc4b33ea73e1b304a23fa93839c76bab58d65645833
3
  size 5816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:652c8ce42c66ba23561de837fae1da08a712795400ecc170511dcf7fa6b44940
3
  size 5816