Training in progress, step 50
Browse files- model.safetensors +1 -1
- runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3 +2 -2
- runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947875.92b2e0e6fb20.2194.5 +3 -0
- runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947901.92b2e0e6fb20.2194.6 +3 -0
- trainer_state.json +16 -16
- training_args.bin +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 441154988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b28070514a109f4c6d0cc6bd89ef87ea76348c26aa37d820b2eae9f6195c9738
|
3 |
size 441154988
|
runs/Jun15_00-36-15_92b2e0e6fb20/events.out.tfevents.1749947776.92b2e0e6fb20.2194.3
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:079f4dbb466565a0431e8d93f99f888ff9e82d727edf190150726236219a2b76
|
3 |
+
size 5717
|
runs/Jun15_00-36-38_92b2e0e6fb20/events.out.tfevents.1749947875.92b2e0e6fb20.2194.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04ffe1a33d90bbbfe16f83cd44b5ae14ccb0afef611397e6a0dc4dbbdcdaa40
|
3 |
+
size 1576
|
runs/Jun15_00-38-20_92b2e0e6fb20/events.out.tfevents.1749947901.92b2e0e6fb20.2194.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80235aca5bb0dd08f3e6284a80b3b9bd4ea63ff47c20ab63860a05bdf5217df3
|
3 |
+
size 7232
|
trainer_state.json
CHANGED
@@ -12,40 +12,40 @@
|
|
12 |
{
|
13 |
"epoch": 0,
|
14 |
"step": 0,
|
15 |
-
"train/classification_loss": 0.
|
16 |
-
"train/contrastive_loss":
|
17 |
-
"train/negative_loss":
|
18 |
"train/num_negatives": 190,
|
19 |
"train/num_positives": 50,
|
20 |
-
"train/positive_loss": 0.
|
21 |
-
"train/total_loss": 2.
|
22 |
},
|
23 |
{
|
24 |
"epoch": 0,
|
25 |
"step": 0,
|
26 |
-
"train/classification_loss": 0.
|
27 |
-
"train/contrastive_loss": 6.
|
28 |
-
"train/negative_loss": 6.
|
29 |
"train/num_negatives": 192,
|
30 |
"train/num_positives": 48,
|
31 |
-
"train/positive_loss": 0.
|
32 |
-
"train/total_loss": 2.
|
33 |
},
|
34 |
{
|
35 |
"epoch": 5.0,
|
36 |
-
"grad_norm":
|
37 |
"learning_rate": 9.800000000000001e-06,
|
38 |
-
"loss":
|
39 |
"step": 50
|
40 |
},
|
41 |
{
|
42 |
"epoch": 5.0,
|
43 |
"step": 50,
|
44 |
"total_flos": 0.0,
|
45 |
-
"train_loss":
|
46 |
-
"train_runtime":
|
47 |
-
"train_samples_per_second":
|
48 |
-
"train_steps_per_second": 1.
|
49 |
}
|
50 |
],
|
51 |
"logging_steps": 50,
|
|
|
12 |
{
|
13 |
"epoch": 0,
|
14 |
"step": 0,
|
15 |
+
"train/classification_loss": 0.6832770109176636,
|
16 |
+
"train/contrastive_loss": 7.157876014709473,
|
17 |
+
"train/negative_loss": 7.157375812530518,
|
18 |
"train/num_negatives": 190,
|
19 |
"train/num_positives": 50,
|
20 |
+
"train/positive_loss": 0.0005001117824576795,
|
21 |
+
"train/total_loss": 2.1148521900177
|
22 |
},
|
23 |
{
|
24 |
"epoch": 0,
|
25 |
"step": 0,
|
26 |
+
"train/classification_loss": 0.691846489906311,
|
27 |
+
"train/contrastive_loss": 6.978695392608643,
|
28 |
+
"train/negative_loss": 6.977847576141357,
|
29 |
"train/num_negatives": 192,
|
30 |
"train/num_positives": 48,
|
31 |
+
"train/positive_loss": 0.0008476818911731243,
|
32 |
+
"train/total_loss": 2.08758544921875
|
33 |
},
|
34 |
{
|
35 |
"epoch": 5.0,
|
36 |
+
"grad_norm": 9.853194236755371,
|
37 |
"learning_rate": 9.800000000000001e-06,
|
38 |
+
"loss": 2.9901,
|
39 |
"step": 50
|
40 |
},
|
41 |
{
|
42 |
"epoch": 5.0,
|
43 |
"step": 50,
|
44 |
"total_flos": 0.0,
|
45 |
+
"train_loss": 2.9900537109375,
|
46 |
+
"train_runtime": 27.9302,
|
47 |
+
"train_samples_per_second": 56.57,
|
48 |
+
"train_steps_per_second": 1.79
|
49 |
}
|
50 |
],
|
51 |
"logging_steps": 50,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5368
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c02a3dbfbd9db3f1e4a919c78948efb8eb944344dc26585f19fc5dded995095b
|
3 |
size 5368
|