maximuspowers commited on
Commit
9cbf8ba
·
verified ·
1 Parent(s): e6f645a

Training in progress, step 50

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1da099a0d87099a0b0c9bbf7ea0ae5a6eabcb8d3810f4e9df2b957493c6c6cd5
3
  size 441154988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b28070514a109f4c6d0cc6bd89ef87ea76348c26aa37d820b2eae9f6195c9738
3
  size 441154988
runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68675bc2ed356d6254de5ab1384465e36b4be95c84b4e8a3d42ed7285f48064e
3
- size 4184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:079f4dbb466565a0431e8d93f99f888ff9e82d727edf190150726236219a2b76
3
+ size 5717
runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947875.92b2e0e6fb20.2194.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04ffe1a33d90bbbfe16f83cd44b5ae14ccb0afef611397e6a0dc4dbbdcdaa40
3
+ size 1576
runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947901.92b2e0e6fb20.2194.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80235aca5bb0dd08f3e6284a80b3b9bd4ea63ff47c20ab63860a05bdf5217df3
3
+ size 7232
trainer_state.json CHANGED
@@ -12,40 +12,40 @@
12
  {
13
  "epoch": 0,
14
  "step": 0,
15
- "train/classification_loss": 0.6716318130493164,
16
- "train/contrastive_loss": 6.973960876464844,
17
- "train/negative_loss": 6.973352909088135,
18
  "train/num_negatives": 190,
19
  "train/num_positives": 50,
20
- "train/positive_loss": 0.0006079699960537255,
21
- "train/total_loss": 2.0664238929748535
22
  },
23
  {
24
  "epoch": 0,
25
  "step": 0,
26
- "train/classification_loss": 0.6844258904457092,
27
- "train/contrastive_loss": 6.779294490814209,
28
- "train/negative_loss": 6.7774882316589355,
29
  "train/num_negatives": 192,
30
  "train/num_positives": 48,
31
- "train/positive_loss": 0.0018063625320792198,
32
- "train/total_loss": 2.0402848720550537
33
  },
34
  {
35
  "epoch": 5.0,
36
- "grad_norm": 5.838413238525391,
37
  "learning_rate": 9.800000000000001e-06,
38
- "loss": 1.4132,
39
  "step": 50
40
  },
41
  {
42
  "epoch": 5.0,
43
  "step": 50,
44
  "total_flos": 0.0,
45
- "train_loss": 1.413243408203125,
46
- "train_runtime": 29.4518,
47
- "train_samples_per_second": 53.647,
48
- "train_steps_per_second": 1.698
49
  }
50
  ],
51
  "logging_steps": 50,
 
12
  {
13
  "epoch": 0,
14
  "step": 0,
15
+ "train/classification_loss": 0.6832770109176636,
16
+ "train/contrastive_loss": 7.157876014709473,
17
+ "train/negative_loss": 7.157375812530518,
18
  "train/num_negatives": 190,
19
  "train/num_positives": 50,
20
+ "train/positive_loss": 0.0005001117824576795,
21
+ "train/total_loss": 2.1148521900177
22
  },
23
  {
24
  "epoch": 0,
25
  "step": 0,
26
+ "train/classification_loss": 0.691846489906311,
27
+ "train/contrastive_loss": 6.978695392608643,
28
+ "train/negative_loss": 6.977847576141357,
29
  "train/num_negatives": 192,
30
  "train/num_positives": 48,
31
+ "train/positive_loss": 0.0008476818911731243,
32
+ "train/total_loss": 2.08758544921875
33
  },
34
  {
35
  "epoch": 5.0,
36
+ "grad_norm": 9.853194236755371,
37
  "learning_rate": 9.800000000000001e-06,
38
+ "loss": 2.9901,
39
  "step": 50
40
  },
41
  {
42
  "epoch": 5.0,
43
  "step": 50,
44
  "total_flos": 0.0,
45
+ "train_loss": 2.9900537109375,
46
+ "train_runtime": 27.9302,
47
+ "train_samples_per_second": 56.57,
48
+ "train_steps_per_second": 1.79
49
  }
50
  ],
51
  "logging_steps": 50,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ca0afef15a0edecfaa88b54e14baf2e856c7793f28bd79fd10178152b6b37f8
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c02a3dbfbd9db3f1e4a919c78948efb8eb944344dc26585f19fc5dded995095b
3
  size 5368