lukahh committed on
Commit
f8b2633
·
verified ·
1 Parent(s): 406ac44

End of training

Browse files
Files changed (6) hide show
  1. README.md +2 -0
  2. all_results.json +10 -10
  3. eval_results.json +5 -5
  4. tokenizer.json +2 -16
  5. train_results.json +6 -6
  6. trainer_state.json +32 -18
README.md CHANGED
@@ -14,6 +14,8 @@ should probably proofread and complete it, then remove this comment. -->
14
  # cultureclip_sd_0226
15
 
16
  This model is a fine-tuned version of [openai/clip-vit-large-patch14](https://huggingface.co/openai/clip-vit-large-patch14) on an unknown dataset.
 
 
17
 
18
  ## Model description
19
 
 
14
  # cultureclip_sd_0226
15
 
16
  This model is a fine-tuned version of [openai/clip-vit-large-patch14](https://huggingface.co/openai/clip-vit-large-patch14) on an unknown dataset.
17
+ It achieves the following results on the evaluation set:
18
+ - Loss: 0.0008
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_loss": 0.00021045817993581295,
4
- "eval_runtime": 2.7761,
5
- "eval_samples_per_second": 20.172,
6
- "eval_steps_per_second": 2.521,
7
- "total_flos": 9864573991549200.0,
8
- "train_loss": 0.1267506488533907,
9
- "train_runtime": 3359.5638,
10
- "train_samples_per_second": 16.324,
11
- "train_steps_per_second": 0.256
12
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_loss": 0.0008266960503533483,
4
+ "eval_runtime": 2.8363,
5
+ "eval_samples_per_second": 19.744,
6
+ "eval_steps_per_second": 2.468,
7
+ "total_flos": 4932286995774600.0,
8
+ "train_loss": 0.030539887709103243,
9
+ "train_runtime": 1868.9702,
10
+ "train_samples_per_second": 14.671,
11
+ "train_steps_per_second": 0.918
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 10.0,
3
- "eval_loss": 0.00021045817993581295,
4
- "eval_runtime": 2.7761,
5
- "eval_samples_per_second": 20.172,
6
- "eval_steps_per_second": 2.521
7
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_loss": 0.0008266960503533483,
4
+ "eval_runtime": 2.8363,
5
+ "eval_samples_per_second": 19.744,
6
+ "eval_steps_per_second": 2.468
7
  }
tokenizer.json CHANGED
@@ -1,21 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 77,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 77
12
- },
13
- "direction": "Right",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 49407,
16
- "pad_type_id": 0,
17
- "pad_token": "<|endoftext|>"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 49406,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 49406,
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 10.0,
3
- "total_flos": 9864573991549200.0,
4
- "train_loss": 0.1267506488533907,
5
- "train_runtime": 3359.5638,
6
- "train_samples_per_second": 16.324,
7
- "train_steps_per_second": 0.256
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "total_flos": 4932286995774600.0,
4
+ "train_loss": 0.030539887709103243,
5
+ "train_runtime": 1868.9702,
6
+ "train_samples_per_second": 14.671,
7
+ "train_steps_per_second": 0.918
8
  }
trainer_state.json CHANGED
@@ -1,34 +1,48 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
- "eval_steps": 500.0,
6
- "global_step": 860,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 5.813953488372093,
13
- "grad_norm": 5.5346174240112305,
14
- "learning_rate": 3e-05,
15
- "loss": 0.1406,
16
  "step": 500
17
  },
18
  {
19
- "epoch": 10.0,
20
- "step": 860,
21
- "total_flos": 9864573991549200.0,
22
- "train_loss": 0.1267506488533907,
23
- "train_runtime": 3359.5638,
24
- "train_samples_per_second": 16.324,
25
- "train_steps_per_second": 0.256
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
  "logging_steps": 500,
29
- "max_steps": 860,
30
  "num_input_tokens_seen": 0,
31
- "num_train_epochs": 10,
32
  "save_steps": 500,
33
  "stateful_callbacks": {
34
  "TrainerControl": {
@@ -42,8 +56,8 @@
42
  "attributes": {}
43
  }
44
  },
45
- "total_flos": 9864573991549200.0,
46
- "train_batch_size": 64,
47
  "trial_name": null,
48
  "trial_params": null
49
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.0,
5
+ "eval_steps": 200.0,
6
+ "global_step": 1715,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 1.4577259475218658,
13
+ "grad_norm": 0.005862534046173096,
14
+ "learning_rate": 8.01980198019802e-07,
15
+ "loss": 0.0387,
16
  "step": 500
17
  },
18
  {
19
+ "epoch": 2.9154518950437316,
20
+ "grad_norm": 39.22230911254883,
21
+ "learning_rate": 4.7194719471947193e-07,
22
+ "loss": 0.0292,
23
+ "step": 1000
24
+ },
25
+ {
26
+ "epoch": 4.373177842565598,
27
+ "grad_norm": 29.80740737915039,
28
+ "learning_rate": 1.419141914191419e-07,
29
+ "loss": 0.0235,
30
+ "step": 1500
31
+ },
32
+ {
33
+ "epoch": 5.0,
34
+ "step": 1715,
35
+ "total_flos": 4932286995774600.0,
36
+ "train_loss": 0.030539887709103243,
37
+ "train_runtime": 1868.9702,
38
+ "train_samples_per_second": 14.671,
39
+ "train_steps_per_second": 0.918
40
  }
41
  ],
42
  "logging_steps": 500,
43
+ "max_steps": 1715,
44
  "num_input_tokens_seen": 0,
45
+ "num_train_epochs": 5,
46
  "save_steps": 500,
47
  "stateful_callbacks": {
48
  "TrainerControl": {
 
56
  "attributes": {}
57
  }
58
  },
59
+ "total_flos": 4932286995774600.0,
60
+ "train_batch_size": 16,
61
  "trial_name": null,
62
  "trial_params": null
63
  }