Harsh1729 committed on
Commit
8c588a3
·
verified ·
1 Parent(s): 407deb0

Initial push of retrained model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +131 -0
  2. README.md +59 -0
  3. all_results.json +9 -0
  4. checkpoint-71/optimizer_0/.metadata +3 -0
  5. checkpoint-71/optimizer_0/__0_0.distcp +3 -0
  6. checkpoint-71/optimizer_0/__10_0.distcp +3 -0
  7. checkpoint-71/optimizer_0/__11_0.distcp +3 -0
  8. checkpoint-71/optimizer_0/__12_0.distcp +3 -0
  9. checkpoint-71/optimizer_0/__13_0.distcp +3 -0
  10. checkpoint-71/optimizer_0/__14_0.distcp +3 -0
  11. checkpoint-71/optimizer_0/__15_0.distcp +3 -0
  12. checkpoint-71/optimizer_0/__16_0.distcp +3 -0
  13. checkpoint-71/optimizer_0/__17_0.distcp +3 -0
  14. checkpoint-71/optimizer_0/__18_0.distcp +3 -0
  15. checkpoint-71/optimizer_0/__19_0.distcp +3 -0
  16. checkpoint-71/optimizer_0/__1_0.distcp +3 -0
  17. checkpoint-71/optimizer_0/__20_0.distcp +3 -0
  18. checkpoint-71/optimizer_0/__21_0.distcp +3 -0
  19. checkpoint-71/optimizer_0/__22_0.distcp +3 -0
  20. checkpoint-71/optimizer_0/__23_0.distcp +3 -0
  21. checkpoint-71/optimizer_0/__24_0.distcp +3 -0
  22. checkpoint-71/optimizer_0/__25_0.distcp +3 -0
  23. checkpoint-71/optimizer_0/__26_0.distcp +3 -0
  24. checkpoint-71/optimizer_0/__27_0.distcp +3 -0
  25. checkpoint-71/optimizer_0/__28_0.distcp +3 -0
  26. checkpoint-71/optimizer_0/__29_0.distcp +3 -0
  27. checkpoint-71/optimizer_0/__2_0.distcp +3 -0
  28. checkpoint-71/optimizer_0/__30_0.distcp +3 -0
  29. checkpoint-71/optimizer_0/__31_0.distcp +3 -0
  30. checkpoint-71/optimizer_0/__32_0.distcp +3 -0
  31. checkpoint-71/optimizer_0/__33_0.distcp +3 -0
  32. checkpoint-71/optimizer_0/__34_0.distcp +3 -0
  33. checkpoint-71/optimizer_0/__35_0.distcp +3 -0
  34. checkpoint-71/optimizer_0/__36_0.distcp +3 -0
  35. checkpoint-71/optimizer_0/__37_0.distcp +3 -0
  36. checkpoint-71/optimizer_0/__38_0.distcp +3 -0
  37. checkpoint-71/optimizer_0/__39_0.distcp +3 -0
  38. checkpoint-71/optimizer_0/__3_0.distcp +3 -0
  39. checkpoint-71/optimizer_0/__40_0.distcp +3 -0
  40. checkpoint-71/optimizer_0/__41_0.distcp +3 -0
  41. checkpoint-71/optimizer_0/__42_0.distcp +3 -0
  42. checkpoint-71/optimizer_0/__43_0.distcp +3 -0
  43. checkpoint-71/optimizer_0/__44_0.distcp +3 -0
  44. checkpoint-71/optimizer_0/__45_0.distcp +3 -0
  45. checkpoint-71/optimizer_0/__46_0.distcp +3 -0
  46. checkpoint-71/optimizer_0/__47_0.distcp +3 -0
  47. checkpoint-71/optimizer_0/__48_0.distcp +3 -0
  48. checkpoint-71/optimizer_0/__49_0.distcp +3 -0
  49. checkpoint-71/optimizer_0/__4_0.distcp +3 -0
  50. checkpoint-71/optimizer_0/__50_0.distcp +3 -0
.gitattributes CHANGED
@@ -33,3 +33,134 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint-71/optimizer_0/.metadata filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint-71/optimizer_0/__0_0.distcp filter=lfs diff=lfs merge=lfs -text
38
+ checkpoint-71/optimizer_0/__10_0.distcp filter=lfs diff=lfs merge=lfs -text
39
+ checkpoint-71/optimizer_0/__11_0.distcp filter=lfs diff=lfs merge=lfs -text
40
+ checkpoint-71/optimizer_0/__12_0.distcp filter=lfs diff=lfs merge=lfs -text
41
+ checkpoint-71/optimizer_0/__13_0.distcp filter=lfs diff=lfs merge=lfs -text
42
+ checkpoint-71/optimizer_0/__14_0.distcp filter=lfs diff=lfs merge=lfs -text
43
+ checkpoint-71/optimizer_0/__15_0.distcp filter=lfs diff=lfs merge=lfs -text
44
+ checkpoint-71/optimizer_0/__16_0.distcp filter=lfs diff=lfs merge=lfs -text
45
+ checkpoint-71/optimizer_0/__17_0.distcp filter=lfs diff=lfs merge=lfs -text
46
+ checkpoint-71/optimizer_0/__18_0.distcp filter=lfs diff=lfs merge=lfs -text
47
+ checkpoint-71/optimizer_0/__19_0.distcp filter=lfs diff=lfs merge=lfs -text
48
+ checkpoint-71/optimizer_0/__1_0.distcp filter=lfs diff=lfs merge=lfs -text
49
+ checkpoint-71/optimizer_0/__20_0.distcp filter=lfs diff=lfs merge=lfs -text
50
+ checkpoint-71/optimizer_0/__21_0.distcp filter=lfs diff=lfs merge=lfs -text
51
+ checkpoint-71/optimizer_0/__22_0.distcp filter=lfs diff=lfs merge=lfs -text
52
+ checkpoint-71/optimizer_0/__23_0.distcp filter=lfs diff=lfs merge=lfs -text
53
+ checkpoint-71/optimizer_0/__24_0.distcp filter=lfs diff=lfs merge=lfs -text
54
+ checkpoint-71/optimizer_0/__25_0.distcp filter=lfs diff=lfs merge=lfs -text
55
+ checkpoint-71/optimizer_0/__26_0.distcp filter=lfs diff=lfs merge=lfs -text
56
+ checkpoint-71/optimizer_0/__27_0.distcp filter=lfs diff=lfs merge=lfs -text
57
+ checkpoint-71/optimizer_0/__28_0.distcp filter=lfs diff=lfs merge=lfs -text
58
+ checkpoint-71/optimizer_0/__29_0.distcp filter=lfs diff=lfs merge=lfs -text
59
+ checkpoint-71/optimizer_0/__2_0.distcp filter=lfs diff=lfs merge=lfs -text
60
+ checkpoint-71/optimizer_0/__30_0.distcp filter=lfs diff=lfs merge=lfs -text
61
+ checkpoint-71/optimizer_0/__31_0.distcp filter=lfs diff=lfs merge=lfs -text
62
+ checkpoint-71/optimizer_0/__32_0.distcp filter=lfs diff=lfs merge=lfs -text
63
+ checkpoint-71/optimizer_0/__33_0.distcp filter=lfs diff=lfs merge=lfs -text
64
+ checkpoint-71/optimizer_0/__34_0.distcp filter=lfs diff=lfs merge=lfs -text
65
+ checkpoint-71/optimizer_0/__35_0.distcp filter=lfs diff=lfs merge=lfs -text
66
+ checkpoint-71/optimizer_0/__36_0.distcp filter=lfs diff=lfs merge=lfs -text
67
+ checkpoint-71/optimizer_0/__37_0.distcp filter=lfs diff=lfs merge=lfs -text
68
+ checkpoint-71/optimizer_0/__38_0.distcp filter=lfs diff=lfs merge=lfs -text
69
+ checkpoint-71/optimizer_0/__39_0.distcp filter=lfs diff=lfs merge=lfs -text
70
+ checkpoint-71/optimizer_0/__3_0.distcp filter=lfs diff=lfs merge=lfs -text
71
+ checkpoint-71/optimizer_0/__40_0.distcp filter=lfs diff=lfs merge=lfs -text
72
+ checkpoint-71/optimizer_0/__41_0.distcp filter=lfs diff=lfs merge=lfs -text
73
+ checkpoint-71/optimizer_0/__42_0.distcp filter=lfs diff=lfs merge=lfs -text
74
+ checkpoint-71/optimizer_0/__43_0.distcp filter=lfs diff=lfs merge=lfs -text
75
+ checkpoint-71/optimizer_0/__44_0.distcp filter=lfs diff=lfs merge=lfs -text
76
+ checkpoint-71/optimizer_0/__45_0.distcp filter=lfs diff=lfs merge=lfs -text
77
+ checkpoint-71/optimizer_0/__46_0.distcp filter=lfs diff=lfs merge=lfs -text
78
+ checkpoint-71/optimizer_0/__47_0.distcp filter=lfs diff=lfs merge=lfs -text
79
+ checkpoint-71/optimizer_0/__48_0.distcp filter=lfs diff=lfs merge=lfs -text
80
+ checkpoint-71/optimizer_0/__49_0.distcp filter=lfs diff=lfs merge=lfs -text
81
+ checkpoint-71/optimizer_0/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
82
+ checkpoint-71/optimizer_0/__50_0.distcp filter=lfs diff=lfs merge=lfs -text
83
+ checkpoint-71/optimizer_0/__51_0.distcp filter=lfs diff=lfs merge=lfs -text
84
+ checkpoint-71/optimizer_0/__52_0.distcp filter=lfs diff=lfs merge=lfs -text
85
+ checkpoint-71/optimizer_0/__53_0.distcp filter=lfs diff=lfs merge=lfs -text
86
+ checkpoint-71/optimizer_0/__54_0.distcp filter=lfs diff=lfs merge=lfs -text
87
+ checkpoint-71/optimizer_0/__55_0.distcp filter=lfs diff=lfs merge=lfs -text
88
+ checkpoint-71/optimizer_0/__56_0.distcp filter=lfs diff=lfs merge=lfs -text
89
+ checkpoint-71/optimizer_0/__57_0.distcp filter=lfs diff=lfs merge=lfs -text
90
+ checkpoint-71/optimizer_0/__58_0.distcp filter=lfs diff=lfs merge=lfs -text
91
+ checkpoint-71/optimizer_0/__59_0.distcp filter=lfs diff=lfs merge=lfs -text
92
+ checkpoint-71/optimizer_0/__5_0.distcp filter=lfs diff=lfs merge=lfs -text
93
+ checkpoint-71/optimizer_0/__60_0.distcp filter=lfs diff=lfs merge=lfs -text
94
+ checkpoint-71/optimizer_0/__61_0.distcp filter=lfs diff=lfs merge=lfs -text
95
+ checkpoint-71/optimizer_0/__62_0.distcp filter=lfs diff=lfs merge=lfs -text
96
+ checkpoint-71/optimizer_0/__63_0.distcp filter=lfs diff=lfs merge=lfs -text
97
+ checkpoint-71/optimizer_0/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
98
+ checkpoint-71/optimizer_0/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
99
+ checkpoint-71/optimizer_0/__8_0.distcp filter=lfs diff=lfs merge=lfs -text
100
+ checkpoint-71/optimizer_0/__9_0.distcp filter=lfs diff=lfs merge=lfs -text
101
+ checkpoint-71/pytorch_model_fsdp_0/.metadata filter=lfs diff=lfs merge=lfs -text
102
+ checkpoint-71/pytorch_model_fsdp_0/__0_0.distcp filter=lfs diff=lfs merge=lfs -text
103
+ checkpoint-71/pytorch_model_fsdp_0/__10_0.distcp filter=lfs diff=lfs merge=lfs -text
104
+ checkpoint-71/pytorch_model_fsdp_0/__11_0.distcp filter=lfs diff=lfs merge=lfs -text
105
+ checkpoint-71/pytorch_model_fsdp_0/__12_0.distcp filter=lfs diff=lfs merge=lfs -text
106
+ checkpoint-71/pytorch_model_fsdp_0/__13_0.distcp filter=lfs diff=lfs merge=lfs -text
107
+ checkpoint-71/pytorch_model_fsdp_0/__14_0.distcp filter=lfs diff=lfs merge=lfs -text
108
+ checkpoint-71/pytorch_model_fsdp_0/__15_0.distcp filter=lfs diff=lfs merge=lfs -text
109
+ checkpoint-71/pytorch_model_fsdp_0/__16_0.distcp filter=lfs diff=lfs merge=lfs -text
110
+ checkpoint-71/pytorch_model_fsdp_0/__17_0.distcp filter=lfs diff=lfs merge=lfs -text
111
+ checkpoint-71/pytorch_model_fsdp_0/__18_0.distcp filter=lfs diff=lfs merge=lfs -text
112
+ checkpoint-71/pytorch_model_fsdp_0/__19_0.distcp filter=lfs diff=lfs merge=lfs -text
113
+ checkpoint-71/pytorch_model_fsdp_0/__1_0.distcp filter=lfs diff=lfs merge=lfs -text
114
+ checkpoint-71/pytorch_model_fsdp_0/__20_0.distcp filter=lfs diff=lfs merge=lfs -text
115
+ checkpoint-71/pytorch_model_fsdp_0/__21_0.distcp filter=lfs diff=lfs merge=lfs -text
116
+ checkpoint-71/pytorch_model_fsdp_0/__22_0.distcp filter=lfs diff=lfs merge=lfs -text
117
+ checkpoint-71/pytorch_model_fsdp_0/__23_0.distcp filter=lfs diff=lfs merge=lfs -text
118
+ checkpoint-71/pytorch_model_fsdp_0/__24_0.distcp filter=lfs diff=lfs merge=lfs -text
119
+ checkpoint-71/pytorch_model_fsdp_0/__25_0.distcp filter=lfs diff=lfs merge=lfs -text
120
+ checkpoint-71/pytorch_model_fsdp_0/__26_0.distcp filter=lfs diff=lfs merge=lfs -text
121
+ checkpoint-71/pytorch_model_fsdp_0/__27_0.distcp filter=lfs diff=lfs merge=lfs -text
122
+ checkpoint-71/pytorch_model_fsdp_0/__28_0.distcp filter=lfs diff=lfs merge=lfs -text
123
+ checkpoint-71/pytorch_model_fsdp_0/__29_0.distcp filter=lfs diff=lfs merge=lfs -text
124
+ checkpoint-71/pytorch_model_fsdp_0/__2_0.distcp filter=lfs diff=lfs merge=lfs -text
125
+ checkpoint-71/pytorch_model_fsdp_0/__30_0.distcp filter=lfs diff=lfs merge=lfs -text
126
+ checkpoint-71/pytorch_model_fsdp_0/__31_0.distcp filter=lfs diff=lfs merge=lfs -text
127
+ checkpoint-71/pytorch_model_fsdp_0/__32_0.distcp filter=lfs diff=lfs merge=lfs -text
128
+ checkpoint-71/pytorch_model_fsdp_0/__33_0.distcp filter=lfs diff=lfs merge=lfs -text
129
+ checkpoint-71/pytorch_model_fsdp_0/__34_0.distcp filter=lfs diff=lfs merge=lfs -text
130
+ checkpoint-71/pytorch_model_fsdp_0/__35_0.distcp filter=lfs diff=lfs merge=lfs -text
131
+ checkpoint-71/pytorch_model_fsdp_0/__36_0.distcp filter=lfs diff=lfs merge=lfs -text
132
+ checkpoint-71/pytorch_model_fsdp_0/__37_0.distcp filter=lfs diff=lfs merge=lfs -text
133
+ checkpoint-71/pytorch_model_fsdp_0/__38_0.distcp filter=lfs diff=lfs merge=lfs -text
134
+ checkpoint-71/pytorch_model_fsdp_0/__39_0.distcp filter=lfs diff=lfs merge=lfs -text
135
+ checkpoint-71/pytorch_model_fsdp_0/__3_0.distcp filter=lfs diff=lfs merge=lfs -text
136
+ checkpoint-71/pytorch_model_fsdp_0/__40_0.distcp filter=lfs diff=lfs merge=lfs -text
137
+ checkpoint-71/pytorch_model_fsdp_0/__41_0.distcp filter=lfs diff=lfs merge=lfs -text
138
+ checkpoint-71/pytorch_model_fsdp_0/__42_0.distcp filter=lfs diff=lfs merge=lfs -text
139
+ checkpoint-71/pytorch_model_fsdp_0/__43_0.distcp filter=lfs diff=lfs merge=lfs -text
140
+ checkpoint-71/pytorch_model_fsdp_0/__44_0.distcp filter=lfs diff=lfs merge=lfs -text
141
+ checkpoint-71/pytorch_model_fsdp_0/__45_0.distcp filter=lfs diff=lfs merge=lfs -text
142
+ checkpoint-71/pytorch_model_fsdp_0/__46_0.distcp filter=lfs diff=lfs merge=lfs -text
143
+ checkpoint-71/pytorch_model_fsdp_0/__47_0.distcp filter=lfs diff=lfs merge=lfs -text
144
+ checkpoint-71/pytorch_model_fsdp_0/__48_0.distcp filter=lfs diff=lfs merge=lfs -text
145
+ checkpoint-71/pytorch_model_fsdp_0/__49_0.distcp filter=lfs diff=lfs merge=lfs -text
146
+ checkpoint-71/pytorch_model_fsdp_0/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
147
+ checkpoint-71/pytorch_model_fsdp_0/__50_0.distcp filter=lfs diff=lfs merge=lfs -text
148
+ checkpoint-71/pytorch_model_fsdp_0/__51_0.distcp filter=lfs diff=lfs merge=lfs -text
149
+ checkpoint-71/pytorch_model_fsdp_0/__52_0.distcp filter=lfs diff=lfs merge=lfs -text
150
+ checkpoint-71/pytorch_model_fsdp_0/__53_0.distcp filter=lfs diff=lfs merge=lfs -text
151
+ checkpoint-71/pytorch_model_fsdp_0/__54_0.distcp filter=lfs diff=lfs merge=lfs -text
152
+ checkpoint-71/pytorch_model_fsdp_0/__55_0.distcp filter=lfs diff=lfs merge=lfs -text
153
+ checkpoint-71/pytorch_model_fsdp_0/__56_0.distcp filter=lfs diff=lfs merge=lfs -text
154
+ checkpoint-71/pytorch_model_fsdp_0/__57_0.distcp filter=lfs diff=lfs merge=lfs -text
155
+ checkpoint-71/pytorch_model_fsdp_0/__58_0.distcp filter=lfs diff=lfs merge=lfs -text
156
+ checkpoint-71/pytorch_model_fsdp_0/__59_0.distcp filter=lfs diff=lfs merge=lfs -text
157
+ checkpoint-71/pytorch_model_fsdp_0/__5_0.distcp filter=lfs diff=lfs merge=lfs -text
158
+ checkpoint-71/pytorch_model_fsdp_0/__60_0.distcp filter=lfs diff=lfs merge=lfs -text
159
+ checkpoint-71/pytorch_model_fsdp_0/__61_0.distcp filter=lfs diff=lfs merge=lfs -text
160
+ checkpoint-71/pytorch_model_fsdp_0/__62_0.distcp filter=lfs diff=lfs merge=lfs -text
161
+ checkpoint-71/pytorch_model_fsdp_0/__63_0.distcp filter=lfs diff=lfs merge=lfs -text
162
+ checkpoint-71/pytorch_model_fsdp_0/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
163
+ checkpoint-71/pytorch_model_fsdp_0/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
164
+ checkpoint-71/pytorch_model_fsdp_0/__8_0.distcp filter=lfs diff=lfs merge=lfs -text
165
+ checkpoint-71/pytorch_model_fsdp_0/__9_0.distcp filter=lfs diff=lfs merge=lfs -text
166
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
3
+ library_name: transformers
4
+ model_name:
5
+ tags:
6
+ - sft
7
+ - full-finetuning
8
+ tags:
9
+ - generated_from_trainer
10
+ licence: license
11
+ ---
12
+
13
+ # Model Card for a fine-tuned DeepSeek-R1-Distill-Llama-8B (SFT, full fine-tuning)
14
+
15
+ This model is a fine-tuned version of [deepseek-ai/DeepSeek-R1-Distill-Llama-8B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-8B).
16
+ It has been trained using [TRL](https://github.com/huggingface/trl).
17
+
18
+ ## Quick start
19
+
20
+ ```python
21
+ from transformers import pipeline
22
+
23
+ question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
24
+ generator = pipeline("text-generation", model="<path-or-hub-id-of-this-model>", device="cuda")
25
+ output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
26
+ print(output["generated_text"])
27
+ ```
28
+
29
+ ## Training procedure
30
+
31
+
32
+
33
+
34
+ This model was trained with SFT.
35
+
36
+ ### Framework versions
37
+
38
+ - TRL: 0.13.0
39
+ - Transformers: 4.46.0
40
+ - PyTorch: 2.4.0
41
+ - Datasets: 3.2.0
42
+ - Tokenizers: 0.20.1
43
+
44
+ ## Citations
45
+
46
+
47
+
48
+ Cite TRL as:
49
+
50
+ ```bibtex
51
+ @misc{vonwerra2022trl,
52
+ title = {{TRL: Transformer Reinforcement Learning}},
53
+ author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallouédec},
54
+ year = 2020,
55
+ journal = {GitHub repository},
56
+ publisher = {GitHub},
57
+ howpublished = {\url{https://github.com/huggingface/trl}}
58
+ }
59
+ ```
all_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 0.993006993006993,
3
+ "total_flos": 1.6814365427000934e+17,
4
+ "train_loss": 1.0495624525446288,
5
+ "train_runtime": 12091.2309,
6
+ "train_samples": 43759,
7
+ "train_samples_per_second": 4.529,
8
+ "train_steps_per_second": 0.006
9
+ }
checkpoint-71/optimizer_0/.metadata ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b543975e32cfc638b69de6f3f0efce4a329a1bffd016ddf13ab49dd14cba34a7
3
+ size 7326437
checkpoint-71/optimizer_0/__0_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0cec445fc052f47619083c7f5e8b7d85afb9f2cceda069ba212de63052123aa
3
+ size 1004469416
checkpoint-71/optimizer_0/__10_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec98c4330115322acd50987209d2255f0e6faf7a178e844367bbe31282986b2a
3
+ size 1004475316
checkpoint-71/optimizer_0/__11_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27b1c34d0a6b6c4660dba9ab5a5ed8efed5dd7051e3033cd893b9a04971dde84
3
+ size 1004475316
checkpoint-71/optimizer_0/__12_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7619afac97039abcd17e59a74773fabe38fdef20954a98d00af294420e5c2a5a
3
+ size 1004475316
checkpoint-71/optimizer_0/__13_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:603eee538d85aceb9012de4c9c2a2d1836d95e1d05767b2f373c981e3f1a871c
3
+ size 1004475316
checkpoint-71/optimizer_0/__14_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:908ec24e148aa120e255599f666061aa00046eb8d6a4f17adb22195d5d9fbf2e
3
+ size 1004475316
checkpoint-71/optimizer_0/__15_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0442bcb7c394360107abd08add7aa7dab0a2b57a6ab350f001132996b4bd3045
3
+ size 1004475316
checkpoint-71/optimizer_0/__16_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c87a403ba95856910c39a9c98c910d00187611392a287ee46a02e3bc9324fe4
3
+ size 1004475316
checkpoint-71/optimizer_0/__17_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7223d78deacc58c93cec8a1f081d7afe2e7b7e9b3c7a65285222375e7d68e3b
3
+ size 1004475316
checkpoint-71/optimizer_0/__18_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c1275bc9ad19f5f587fff8f93d9b25f914d7de5231dbd93a374922ffb6c2381
3
+ size 1004475316
checkpoint-71/optimizer_0/__19_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2116388a557a68f97a78ea1fa18266f473d4286c9d59f4afb56153c600c04dad
3
+ size 1004475316
checkpoint-71/optimizer_0/__1_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad242006b33e0307ccbb9d1f76e163517e6be79a734ec02569e62f6bcc4bb690
3
+ size 1004475316
checkpoint-71/optimizer_0/__20_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0c44e59a58a2675bd697b763f349cc6762fd2b97b3cbe9d6018b6f4a00ef947
3
+ size 1004475316
checkpoint-71/optimizer_0/__21_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9081ac24f52d114eb82b6279e675f60472efa96c186253085fa7ca13c655673
3
+ size 1004475316
checkpoint-71/optimizer_0/__22_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97b99215abb812eb2d5a65c3279acefa3f8ad99223ef53bd05c783bb2bec624e
3
+ size 1004475316
checkpoint-71/optimizer_0/__23_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a62ed26cfb5a9f94a0f774f6671935762a467f72cba37e54b18af5ef38bf2d5
3
+ size 1004475316
checkpoint-71/optimizer_0/__24_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:050b7939615da96106772afc82a2cd9567028ae93932563b5321bafe18cbe1fa
3
+ size 1004475316
checkpoint-71/optimizer_0/__25_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aec6361ee1502f89430f1ffddd3abb5b7383fd37933ab90e01b361ef2835b9c
3
+ size 1004475316
checkpoint-71/optimizer_0/__26_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:600f232035946120ac1390f57021a34f17bea2d5dfd805d9a4e83a3964ec6995
3
+ size 1004475316
checkpoint-71/optimizer_0/__27_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd883db282faed4c2b4cc7658afb59d68d60d1d2c0a6b91aa1ea47638414b91a
3
+ size 1004475316
checkpoint-71/optimizer_0/__28_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9098c47787db85588e8ec5368a55329482d739eff6681a7fc50b575ef8e58ed4
3
+ size 1004475316
checkpoint-71/optimizer_0/__29_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa671264a735d0e8bcfed175b877cfc31e9f789e7f53f319c71908e0768f43e7
3
+ size 1004475316
checkpoint-71/optimizer_0/__2_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0ee2fadd77b89fba0684dcfd30a88cc7a567af8a64f97368ede8964d2af3fb6
3
+ size 1004475316
checkpoint-71/optimizer_0/__30_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a042ab745adbc8330594cd861d6020e2c40bc8a45742926263425a4c329173f
3
+ size 1004475316
checkpoint-71/optimizer_0/__31_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49ed97969b385229ca5dba05fc00a8e1a8bb715bafde0aefc9adde7ea6f78600
3
+ size 1004475316
checkpoint-71/optimizer_0/__32_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff73360edc4f49e98c9c1ee8b2adcb3d1e4e9a03349912484d6765058cb17f7e
3
+ size 1004475316
checkpoint-71/optimizer_0/__33_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa8ad1a4d67e0f243cf0eddb302dd524e66027ed3ad05e6f25adca2f7de28f2d
3
+ size 1004475316
checkpoint-71/optimizer_0/__34_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3cb88e4f2e27a4e228786f3d91f7a660a51feb3def2d001c0bf2db519b7732c
3
+ size 1004475316
checkpoint-71/optimizer_0/__35_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9eafdba6d23a43d868da37bfb3c5b9de2140ceb46e9c4ecfafb6529841dbe56
3
+ size 1004475316
checkpoint-71/optimizer_0/__36_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2817bb28216be7795ceff9d86092df0deff15ed54a78332d7c2425255c3cab48
3
+ size 1004475316
checkpoint-71/optimizer_0/__37_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf362a32f842c01c36ffb2a999d9ab26554bd8afef72ad0a3b7c464c5df760e8
3
+ size 1004475316
checkpoint-71/optimizer_0/__38_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63def0f1361594d2192d24c0eeabb1959ad022413c0cb0e37673f303d903f6e7
3
+ size 1004475316
checkpoint-71/optimizer_0/__39_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30be6d7cacb28ef8f695cdd7eb98d778d4762de1999291da73920cd4e065f265
3
+ size 1004475316
checkpoint-71/optimizer_0/__3_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:948002b45c957d1b19a2a9416c67f9b10d5bfd32af440486f8b970560cf9a5d2
3
+ size 1004475316
checkpoint-71/optimizer_0/__40_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb12ad38a29bdabcbadd4a33ece7f0191c40c9af33e840b4f18c3eef6d5f431f
3
+ size 1004475000
checkpoint-71/optimizer_0/__41_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd777702ce109ff00d2f0830586c00a3e64eb78b88441f50329e8854e26929f3
3
+ size 1004475000
checkpoint-71/optimizer_0/__42_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63df45d6a488d04e261c75ada2c7f5c4d4151d1f716890f8d6af3d254dbc6297
3
+ size 1004475000
checkpoint-71/optimizer_0/__43_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb4f9daaff7e3b0d8fe85d6acfac683808c879669c394568b6ef6024582dfd4f
3
+ size 1004475000
checkpoint-71/optimizer_0/__44_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2ed8d095dd9ca0d577e596fa5b82e203914a77cf5325084ce50bb6af08fac65
3
+ size 1004475000
checkpoint-71/optimizer_0/__45_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be2ffc9df0516a623f0701d35540e40d7984a09256e13cc773f68e78a755b06d
3
+ size 1004475000
checkpoint-71/optimizer_0/__46_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:767f4bab783673cb96ab4373f6ada658e0d10cd58bc84f6219b0e18537251e16
3
+ size 1004475000
checkpoint-71/optimizer_0/__47_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea8b772a1fdb14eb190b915d6602c1ebc66c3cc2187b64423bd4048ee2312a95
3
+ size 1004475000
checkpoint-71/optimizer_0/__48_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1515228871e89e286700857a9123d5c1f3bf732f227847c67ea802f8766ff90
3
+ size 1004475000
checkpoint-71/optimizer_0/__49_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd133e09b4e511ea9d4b229b446a8fc1725d30953caedb6f12f42e96449c07ed
3
+ size 1004475000
checkpoint-71/optimizer_0/__4_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10fda3d3a2d843c1d5098d2ee1d25d2a6daf8ddaafdec9d7aa16d02157aff752
3
+ size 1004475316
checkpoint-71/optimizer_0/__50_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d03cab7298b118ce7b75a57aed37085bba683771317a6a758f318634536945d
3
+ size 1004475000