maximuspowers commited on
Commit
38a9168
·
verified ·
1 Parent(s): 108859b

Training in progress, step 50

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:216c5222dbcb5ff5f52be7e8f46a9e2b8eafc2fcae66f4d5dcf5f48ec85747f8
3
  size 441154988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1da099a0d87099a0b0c9bbf7ea0ae5a6eabcb8d3810f4e9df2b957493c6c6cd5
3
  size 441154988
runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68675bc2ed356d6254de5ab1384465e36b4be95c84b4e8a3d42ed7285f48064e
3
+ size 4184
runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947799.92b2e0e6fb20.2194.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b53fa14b07f1f332f117f6e642eab76308f876681d29b0a1619b45f1a1bf7b14
3
+ size 7232
trainer_state.json ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 5.0,
6
+ "eval_steps": 250,
7
+ "global_step": 50,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0,
14
+ "step": 0,
15
+ "train/classification_loss": 0.6716318130493164,
16
+ "train/contrastive_loss": 6.973960876464844,
17
+ "train/negative_loss": 6.973352909088135,
18
+ "train/num_negatives": 190,
19
+ "train/num_positives": 50,
20
+ "train/positive_loss": 0.0006079699960537255,
21
+ "train/total_loss": 2.0664238929748535
22
+ },
23
+ {
24
+ "epoch": 0,
25
+ "step": 0,
26
+ "train/classification_loss": 0.6844258904457092,
27
+ "train/contrastive_loss": 6.779294490814209,
28
+ "train/negative_loss": 6.7774882316589355,
29
+ "train/num_negatives": 192,
30
+ "train/num_positives": 48,
31
+ "train/positive_loss": 0.0018063625320792198,
32
+ "train/total_loss": 2.0402848720550537
33
+ },
34
+ {
35
+ "epoch": 5.0,
36
+ "grad_norm": 5.838413238525391,
37
+ "learning_rate": 9.800000000000001e-06,
38
+ "loss": 1.4132,
39
+ "step": 50
40
+ },
41
+ {
42
+ "epoch": 5.0,
43
+ "step": 50,
44
+ "total_flos": 0.0,
45
+ "train_loss": 1.413243408203125,
46
+ "train_runtime": 29.4518,
47
+ "train_samples_per_second": 53.647,
48
+ "train_steps_per_second": 1.698
49
+ }
50
+ ],
51
+ "logging_steps": 50,
52
+ "max_steps": 50,
53
+ "num_input_tokens_seen": 0,
54
+ "num_train_epochs": 5,
55
+ "save_steps": 500,
56
+ "stateful_callbacks": {
57
+ "EarlyStoppingCallback": {
58
+ "args": {
59
+ "early_stopping_patience": 3,
60
+ "early_stopping_threshold": 0.0
61
+ },
62
+ "attributes": {
63
+ "early_stopping_patience_counter": 0
64
+ }
65
+ },
66
+ "TrainerControl": {
67
+ "args": {
68
+ "should_epoch_stop": false,
69
+ "should_evaluate": false,
70
+ "should_log": false,
71
+ "should_save": true,
72
+ "should_training_stop": true
73
+ },
74
+ "attributes": {}
75
+ }
76
+ },
77
+ "total_flos": 0.0,
78
+ "train_batch_size": 16,
79
+ "trial_name": null,
80
+ "trial_params": null
81
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1cf55407d703d9184ef351e313b0bda1b55c3a6bf45440f6046ba6213b87acd0
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ca0afef15a0edecfaa88b54e14baf2e856c7793f28bd79fd10178152b6b37f8
3
  size 5368