Initial push of retrained model
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +131 -0
- README.md +59 -0
- all_results.json +9 -0
- checkpoint-71/optimizer_0/.metadata +3 -0
- checkpoint-71/optimizer_0/__0_0.distcp +3 -0
- checkpoint-71/optimizer_0/__10_0.distcp +3 -0
- checkpoint-71/optimizer_0/__11_0.distcp +3 -0
- checkpoint-71/optimizer_0/__12_0.distcp +3 -0
- checkpoint-71/optimizer_0/__13_0.distcp +3 -0
- checkpoint-71/optimizer_0/__14_0.distcp +3 -0
- checkpoint-71/optimizer_0/__15_0.distcp +3 -0
- checkpoint-71/optimizer_0/__16_0.distcp +3 -0
- checkpoint-71/optimizer_0/__17_0.distcp +3 -0
- checkpoint-71/optimizer_0/__18_0.distcp +3 -0
- checkpoint-71/optimizer_0/__19_0.distcp +3 -0
- checkpoint-71/optimizer_0/__1_0.distcp +3 -0
- checkpoint-71/optimizer_0/__20_0.distcp +3 -0
- checkpoint-71/optimizer_0/__21_0.distcp +3 -0
- checkpoint-71/optimizer_0/__22_0.distcp +3 -0
- checkpoint-71/optimizer_0/__23_0.distcp +3 -0
- checkpoint-71/optimizer_0/__24_0.distcp +3 -0
- checkpoint-71/optimizer_0/__25_0.distcp +3 -0
- checkpoint-71/optimizer_0/__26_0.distcp +3 -0
- checkpoint-71/optimizer_0/__27_0.distcp +3 -0
- checkpoint-71/optimizer_0/__28_0.distcp +3 -0
- checkpoint-71/optimizer_0/__29_0.distcp +3 -0
- checkpoint-71/optimizer_0/__2_0.distcp +3 -0
- checkpoint-71/optimizer_0/__30_0.distcp +3 -0
- checkpoint-71/optimizer_0/__31_0.distcp +3 -0
- checkpoint-71/optimizer_0/__32_0.distcp +3 -0
- checkpoint-71/optimizer_0/__33_0.distcp +3 -0
- checkpoint-71/optimizer_0/__34_0.distcp +3 -0
- checkpoint-71/optimizer_0/__35_0.distcp +3 -0
- checkpoint-71/optimizer_0/__36_0.distcp +3 -0
- checkpoint-71/optimizer_0/__37_0.distcp +3 -0
- checkpoint-71/optimizer_0/__38_0.distcp +3 -0
- checkpoint-71/optimizer_0/__39_0.distcp +3 -0
- checkpoint-71/optimizer_0/__3_0.distcp +3 -0
- checkpoint-71/optimizer_0/__40_0.distcp +3 -0
- checkpoint-71/optimizer_0/__41_0.distcp +3 -0
- checkpoint-71/optimizer_0/__42_0.distcp +3 -0
- checkpoint-71/optimizer_0/__43_0.distcp +3 -0
- checkpoint-71/optimizer_0/__44_0.distcp +3 -0
- checkpoint-71/optimizer_0/__45_0.distcp +3 -0
- checkpoint-71/optimizer_0/__46_0.distcp +3 -0
- checkpoint-71/optimizer_0/__47_0.distcp +3 -0
- checkpoint-71/optimizer_0/__48_0.distcp +3 -0
- checkpoint-71/optimizer_0/__49_0.distcp +3 -0
- checkpoint-71/optimizer_0/__4_0.distcp +3 -0
- checkpoint-71/optimizer_0/__50_0.distcp +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,134 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
checkpoint-71/optimizer_0/.metadata filter=lfs diff=lfs merge=lfs -text
|
37 |
+
checkpoint-71/optimizer_0/__0_0.distcp filter=lfs diff=lfs merge=lfs -text
|
38 |
+
checkpoint-71/optimizer_0/__10_0.distcp filter=lfs diff=lfs merge=lfs -text
|
39 |
+
checkpoint-71/optimizer_0/__11_0.distcp filter=lfs diff=lfs merge=lfs -text
|
40 |
+
checkpoint-71/optimizer_0/__12_0.distcp filter=lfs diff=lfs merge=lfs -text
|
41 |
+
checkpoint-71/optimizer_0/__13_0.distcp filter=lfs diff=lfs merge=lfs -text
|
42 |
+
checkpoint-71/optimizer_0/__14_0.distcp filter=lfs diff=lfs merge=lfs -text
|
43 |
+
checkpoint-71/optimizer_0/__15_0.distcp filter=lfs diff=lfs merge=lfs -text
|
44 |
+
checkpoint-71/optimizer_0/__16_0.distcp filter=lfs diff=lfs merge=lfs -text
|
45 |
+
checkpoint-71/optimizer_0/__17_0.distcp filter=lfs diff=lfs merge=lfs -text
|
46 |
+
checkpoint-71/optimizer_0/__18_0.distcp filter=lfs diff=lfs merge=lfs -text
|
47 |
+
checkpoint-71/optimizer_0/__19_0.distcp filter=lfs diff=lfs merge=lfs -text
|
48 |
+
checkpoint-71/optimizer_0/__1_0.distcp filter=lfs diff=lfs merge=lfs -text
|
49 |
+
checkpoint-71/optimizer_0/__20_0.distcp filter=lfs diff=lfs merge=lfs -text
|
50 |
+
checkpoint-71/optimizer_0/__21_0.distcp filter=lfs diff=lfs merge=lfs -text
|
51 |
+
checkpoint-71/optimizer_0/__22_0.distcp filter=lfs diff=lfs merge=lfs -text
|
52 |
+
checkpoint-71/optimizer_0/__23_0.distcp filter=lfs diff=lfs merge=lfs -text
|
53 |
+
checkpoint-71/optimizer_0/__24_0.distcp filter=lfs diff=lfs merge=lfs -text
|
54 |
+
checkpoint-71/optimizer_0/__25_0.distcp filter=lfs diff=lfs merge=lfs -text
|
55 |
+
checkpoint-71/optimizer_0/__26_0.distcp filter=lfs diff=lfs merge=lfs -text
|
56 |
+
checkpoint-71/optimizer_0/__27_0.distcp filter=lfs diff=lfs merge=lfs -text
|
57 |
+
checkpoint-71/optimizer_0/__28_0.distcp filter=lfs diff=lfs merge=lfs -text
|
58 |
+
checkpoint-71/optimizer_0/__29_0.distcp filter=lfs diff=lfs merge=lfs -text
|
59 |
+
checkpoint-71/optimizer_0/__2_0.distcp filter=lfs diff=lfs merge=lfs -text
|
60 |
+
checkpoint-71/optimizer_0/__30_0.distcp filter=lfs diff=lfs merge=lfs -text
|
61 |
+
checkpoint-71/optimizer_0/__31_0.distcp filter=lfs diff=lfs merge=lfs -text
|
62 |
+
checkpoint-71/optimizer_0/__32_0.distcp filter=lfs diff=lfs merge=lfs -text
|
63 |
+
checkpoint-71/optimizer_0/__33_0.distcp filter=lfs diff=lfs merge=lfs -text
|
64 |
+
checkpoint-71/optimizer_0/__34_0.distcp filter=lfs diff=lfs merge=lfs -text
|
65 |
+
checkpoint-71/optimizer_0/__35_0.distcp filter=lfs diff=lfs merge=lfs -text
|
66 |
+
checkpoint-71/optimizer_0/__36_0.distcp filter=lfs diff=lfs merge=lfs -text
|
67 |
+
checkpoint-71/optimizer_0/__37_0.distcp filter=lfs diff=lfs merge=lfs -text
|
68 |
+
checkpoint-71/optimizer_0/__38_0.distcp filter=lfs diff=lfs merge=lfs -text
|
69 |
+
checkpoint-71/optimizer_0/__39_0.distcp filter=lfs diff=lfs merge=lfs -text
|
70 |
+
checkpoint-71/optimizer_0/__3_0.distcp filter=lfs diff=lfs merge=lfs -text
|
71 |
+
checkpoint-71/optimizer_0/__40_0.distcp filter=lfs diff=lfs merge=lfs -text
|
72 |
+
checkpoint-71/optimizer_0/__41_0.distcp filter=lfs diff=lfs merge=lfs -text
|
73 |
+
checkpoint-71/optimizer_0/__42_0.distcp filter=lfs diff=lfs merge=lfs -text
|
74 |
+
checkpoint-71/optimizer_0/__43_0.distcp filter=lfs diff=lfs merge=lfs -text
|
75 |
+
checkpoint-71/optimizer_0/__44_0.distcp filter=lfs diff=lfs merge=lfs -text
|
76 |
+
checkpoint-71/optimizer_0/__45_0.distcp filter=lfs diff=lfs merge=lfs -text
|
77 |
+
checkpoint-71/optimizer_0/__46_0.distcp filter=lfs diff=lfs merge=lfs -text
|
78 |
+
checkpoint-71/optimizer_0/__47_0.distcp filter=lfs diff=lfs merge=lfs -text
|
79 |
+
checkpoint-71/optimizer_0/__48_0.distcp filter=lfs diff=lfs merge=lfs -text
|
80 |
+
checkpoint-71/optimizer_0/__49_0.distcp filter=lfs diff=lfs merge=lfs -text
|
81 |
+
checkpoint-71/optimizer_0/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
|
82 |
+
checkpoint-71/optimizer_0/__50_0.distcp filter=lfs diff=lfs merge=lfs -text
|
83 |
+
checkpoint-71/optimizer_0/__51_0.distcp filter=lfs diff=lfs merge=lfs -text
|
84 |
+
checkpoint-71/optimizer_0/__52_0.distcp filter=lfs diff=lfs merge=lfs -text
|
85 |
+
checkpoint-71/optimizer_0/__53_0.distcp filter=lfs diff=lfs merge=lfs -text
|
86 |
+
checkpoint-71/optimizer_0/__54_0.distcp filter=lfs diff=lfs merge=lfs -text
|
87 |
+
checkpoint-71/optimizer_0/__55_0.distcp filter=lfs diff=lfs merge=lfs -text
|
88 |
+
checkpoint-71/optimizer_0/__56_0.distcp filter=lfs diff=lfs merge=lfs -text
|
89 |
+
checkpoint-71/optimizer_0/__57_0.distcp filter=lfs diff=lfs merge=lfs -text
|
90 |
+
checkpoint-71/optimizer_0/__58_0.distcp filter=lfs diff=lfs merge=lfs -text
|
91 |
+
checkpoint-71/optimizer_0/__59_0.distcp filter=lfs diff=lfs merge=lfs -text
|
92 |
+
checkpoint-71/optimizer_0/__5_0.distcp filter=lfs diff=lfs merge=lfs -text
|
93 |
+
checkpoint-71/optimizer_0/__60_0.distcp filter=lfs diff=lfs merge=lfs -text
|
94 |
+
checkpoint-71/optimizer_0/__61_0.distcp filter=lfs diff=lfs merge=lfs -text
|
95 |
+
checkpoint-71/optimizer_0/__62_0.distcp filter=lfs diff=lfs merge=lfs -text
|
96 |
+
checkpoint-71/optimizer_0/__63_0.distcp filter=lfs diff=lfs merge=lfs -text
|
97 |
+
checkpoint-71/optimizer_0/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
|
98 |
+
checkpoint-71/optimizer_0/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
|
99 |
+
checkpoint-71/optimizer_0/__8_0.distcp filter=lfs diff=lfs merge=lfs -text
|
100 |
+
checkpoint-71/optimizer_0/__9_0.distcp filter=lfs diff=lfs merge=lfs -text
|
101 |
+
checkpoint-71/pytorch_model_fsdp_0/.metadata filter=lfs diff=lfs merge=lfs -text
|
102 |
+
checkpoint-71/pytorch_model_fsdp_0/__0_0.distcp filter=lfs diff=lfs merge=lfs -text
|
103 |
+
checkpoint-71/pytorch_model_fsdp_0/__10_0.distcp filter=lfs diff=lfs merge=lfs -text
|
104 |
+
checkpoint-71/pytorch_model_fsdp_0/__11_0.distcp filter=lfs diff=lfs merge=lfs -text
|
105 |
+
checkpoint-71/pytorch_model_fsdp_0/__12_0.distcp filter=lfs diff=lfs merge=lfs -text
|
106 |
+
checkpoint-71/pytorch_model_fsdp_0/__13_0.distcp filter=lfs diff=lfs merge=lfs -text
|
107 |
+
checkpoint-71/pytorch_model_fsdp_0/__14_0.distcp filter=lfs diff=lfs merge=lfs -text
|
108 |
+
checkpoint-71/pytorch_model_fsdp_0/__15_0.distcp filter=lfs diff=lfs merge=lfs -text
|
109 |
+
checkpoint-71/pytorch_model_fsdp_0/__16_0.distcp filter=lfs diff=lfs merge=lfs -text
|
110 |
+
checkpoint-71/pytorch_model_fsdp_0/__17_0.distcp filter=lfs diff=lfs merge=lfs -text
|
111 |
+
checkpoint-71/pytorch_model_fsdp_0/__18_0.distcp filter=lfs diff=lfs merge=lfs -text
|
112 |
+
checkpoint-71/pytorch_model_fsdp_0/__19_0.distcp filter=lfs diff=lfs merge=lfs -text
|
113 |
+
checkpoint-71/pytorch_model_fsdp_0/__1_0.distcp filter=lfs diff=lfs merge=lfs -text
|
114 |
+
checkpoint-71/pytorch_model_fsdp_0/__20_0.distcp filter=lfs diff=lfs merge=lfs -text
|
115 |
+
checkpoint-71/pytorch_model_fsdp_0/__21_0.distcp filter=lfs diff=lfs merge=lfs -text
|
116 |
+
checkpoint-71/pytorch_model_fsdp_0/__22_0.distcp filter=lfs diff=lfs merge=lfs -text
|
117 |
+
checkpoint-71/pytorch_model_fsdp_0/__23_0.distcp filter=lfs diff=lfs merge=lfs -text
|
118 |
+
checkpoint-71/pytorch_model_fsdp_0/__24_0.distcp filter=lfs diff=lfs merge=lfs -text
|
119 |
+
checkpoint-71/pytorch_model_fsdp_0/__25_0.distcp filter=lfs diff=lfs merge=lfs -text
|
120 |
+
checkpoint-71/pytorch_model_fsdp_0/__26_0.distcp filter=lfs diff=lfs merge=lfs -text
|
121 |
+
checkpoint-71/pytorch_model_fsdp_0/__27_0.distcp filter=lfs diff=lfs merge=lfs -text
|
122 |
+
checkpoint-71/pytorch_model_fsdp_0/__28_0.distcp filter=lfs diff=lfs merge=lfs -text
|
123 |
+
checkpoint-71/pytorch_model_fsdp_0/__29_0.distcp filter=lfs diff=lfs merge=lfs -text
|
124 |
+
checkpoint-71/pytorch_model_fsdp_0/__2_0.distcp filter=lfs diff=lfs merge=lfs -text
|
125 |
+
checkpoint-71/pytorch_model_fsdp_0/__30_0.distcp filter=lfs diff=lfs merge=lfs -text
|
126 |
+
checkpoint-71/pytorch_model_fsdp_0/__31_0.distcp filter=lfs diff=lfs merge=lfs -text
|
127 |
+
checkpoint-71/pytorch_model_fsdp_0/__32_0.distcp filter=lfs diff=lfs merge=lfs -text
|
128 |
+
checkpoint-71/pytorch_model_fsdp_0/__33_0.distcp filter=lfs diff=lfs merge=lfs -text
|
129 |
+
checkpoint-71/pytorch_model_fsdp_0/__34_0.distcp filter=lfs diff=lfs merge=lfs -text
|
130 |
+
checkpoint-71/pytorch_model_fsdp_0/__35_0.distcp filter=lfs diff=lfs merge=lfs -text
|
131 |
+
checkpoint-71/pytorch_model_fsdp_0/__36_0.distcp filter=lfs diff=lfs merge=lfs -text
|
132 |
+
checkpoint-71/pytorch_model_fsdp_0/__37_0.distcp filter=lfs diff=lfs merge=lfs -text
|
133 |
+
checkpoint-71/pytorch_model_fsdp_0/__38_0.distcp filter=lfs diff=lfs merge=lfs -text
|
134 |
+
checkpoint-71/pytorch_model_fsdp_0/__39_0.distcp filter=lfs diff=lfs merge=lfs -text
|
135 |
+
checkpoint-71/pytorch_model_fsdp_0/__3_0.distcp filter=lfs diff=lfs merge=lfs -text
|
136 |
+
checkpoint-71/pytorch_model_fsdp_0/__40_0.distcp filter=lfs diff=lfs merge=lfs -text
|
137 |
+
checkpoint-71/pytorch_model_fsdp_0/__41_0.distcp filter=lfs diff=lfs merge=lfs -text
|
138 |
+
checkpoint-71/pytorch_model_fsdp_0/__42_0.distcp filter=lfs diff=lfs merge=lfs -text
|
139 |
+
checkpoint-71/pytorch_model_fsdp_0/__43_0.distcp filter=lfs diff=lfs merge=lfs -text
|
140 |
+
checkpoint-71/pytorch_model_fsdp_0/__44_0.distcp filter=lfs diff=lfs merge=lfs -text
|
141 |
+
checkpoint-71/pytorch_model_fsdp_0/__45_0.distcp filter=lfs diff=lfs merge=lfs -text
|
142 |
+
checkpoint-71/pytorch_model_fsdp_0/__46_0.distcp filter=lfs diff=lfs merge=lfs -text
|
143 |
+
checkpoint-71/pytorch_model_fsdp_0/__47_0.distcp filter=lfs diff=lfs merge=lfs -text
|
144 |
+
checkpoint-71/pytorch_model_fsdp_0/__48_0.distcp filter=lfs diff=lfs merge=lfs -text
|
145 |
+
checkpoint-71/pytorch_model_fsdp_0/__49_0.distcp filter=lfs diff=lfs merge=lfs -text
|
146 |
+
checkpoint-71/pytorch_model_fsdp_0/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
|
147 |
+
checkpoint-71/pytorch_model_fsdp_0/__50_0.distcp filter=lfs diff=lfs merge=lfs -text
|
148 |
+
checkpoint-71/pytorch_model_fsdp_0/__51_0.distcp filter=lfs diff=lfs merge=lfs -text
|
149 |
+
checkpoint-71/pytorch_model_fsdp_0/__52_0.distcp filter=lfs diff=lfs merge=lfs -text
|
150 |
+
checkpoint-71/pytorch_model_fsdp_0/__53_0.distcp filter=lfs diff=lfs merge=lfs -text
|
151 |
+
checkpoint-71/pytorch_model_fsdp_0/__54_0.distcp filter=lfs diff=lfs merge=lfs -text
|
152 |
+
checkpoint-71/pytorch_model_fsdp_0/__55_0.distcp filter=lfs diff=lfs merge=lfs -text
|
153 |
+
checkpoint-71/pytorch_model_fsdp_0/__56_0.distcp filter=lfs diff=lfs merge=lfs -text
|
154 |
+
checkpoint-71/pytorch_model_fsdp_0/__57_0.distcp filter=lfs diff=lfs merge=lfs -text
|
155 |
+
checkpoint-71/pytorch_model_fsdp_0/__58_0.distcp filter=lfs diff=lfs merge=lfs -text
|
156 |
+
checkpoint-71/pytorch_model_fsdp_0/__59_0.distcp filter=lfs diff=lfs merge=lfs -text
|
157 |
+
checkpoint-71/pytorch_model_fsdp_0/__5_0.distcp filter=lfs diff=lfs merge=lfs -text
|
158 |
+
checkpoint-71/pytorch_model_fsdp_0/__60_0.distcp filter=lfs diff=lfs merge=lfs -text
|
159 |
+
checkpoint-71/pytorch_model_fsdp_0/__61_0.distcp filter=lfs diff=lfs merge=lfs -text
|
160 |
+
checkpoint-71/pytorch_model_fsdp_0/__62_0.distcp filter=lfs diff=lfs merge=lfs -text
|
161 |
+
checkpoint-71/pytorch_model_fsdp_0/__63_0.distcp filter=lfs diff=lfs merge=lfs -text
|
162 |
+
checkpoint-71/pytorch_model_fsdp_0/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
|
163 |
+
checkpoint-71/pytorch_model_fsdp_0/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
|
164 |
+
checkpoint-71/pytorch_model_fsdp_0/__8_0.distcp filter=lfs diff=lfs merge=lfs -text
|
165 |
+
checkpoint-71/pytorch_model_fsdp_0/__9_0.distcp filter=lfs diff=lfs merge=lfs -text
|
166 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
3 |
+
library_name: transformers
|
4 |
+
model_name:
|
5 |
+
tags:
|
6 |
+
- sft
|
7 |
+
- full-finetuning
|
8 |
+
tags:
|
9 |
+
- generated_from_trainer
|
10 |
+
licence: license
|
11 |
+
---
|
12 |
+
|
13 |
+
# Model Card for a fine-tuned DeepSeek-R1-Distill-Llama-8B (sft, full-finetuning)
|
14 |
+
|
15 |
+
This model is a fine-tuned version of [deepseek-ai/DeepSeek-R1-Distill-Llama-8B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Llama-8B).
|
16 |
+
It has been trained using [TRL](https://github.com/huggingface/trl).
|
17 |
+
|
18 |
+
## Quick start
|
19 |
+
|
20 |
+
```python
|
21 |
+
from transformers import pipeline
|
22 |
+
|
23 |
+
question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
|
24 |
+
generator = pipeline("text-generation", model="None", device="cuda")
|
25 |
+
output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
|
26 |
+
print(output["generated_text"])
|
27 |
+
```
|
28 |
+
|
29 |
+
## Training procedure
|
30 |
+
|
31 |
+
|
32 |
+
|
33 |
+
|
34 |
+
This model was trained with SFT.
|
35 |
+
|
36 |
+
### Framework versions
|
37 |
+
|
38 |
+
- TRL: 0.13.0
|
39 |
+
- Transformers: 4.46.0
|
40 |
+
- PyTorch: 2.4.0
|
41 |
+
- Datasets: 3.2.0
|
42 |
+
- Tokenizers: 0.20.1
|
43 |
+
|
44 |
+
## Citations
|
45 |
+
|
46 |
+
|
47 |
+
|
48 |
+
Cite TRL as:
|
49 |
+
|
50 |
+
```bibtex
|
51 |
+
@misc{vonwerra2022trl,
|
52 |
+
title = {{TRL: Transformer Reinforcement Learning}},
|
53 |
+
author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallouédec},
|
54 |
+
year = 2020,
|
55 |
+
journal = {GitHub repository},
|
56 |
+
publisher = {GitHub},
|
57 |
+
howpublished = {\url{https://github.com/huggingface/trl}}
|
58 |
+
}
|
59 |
+
```
|
all_results.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 0.993006993006993,
|
3 |
+
"total_flos": 1.6814365427000934e+17,
|
4 |
+
"train_loss": 1.0495624525446288,
|
5 |
+
"train_runtime": 12091.2309,
|
6 |
+
"train_samples": 43759,
|
7 |
+
"train_samples_per_second": 4.529,
|
8 |
+
"train_steps_per_second": 0.006
|
9 |
+
}
|
checkpoint-71/optimizer_0/.metadata
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b543975e32cfc638b69de6f3f0efce4a329a1bffd016ddf13ab49dd14cba34a7
|
3 |
+
size 7326437
|
checkpoint-71/optimizer_0/__0_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0cec445fc052f47619083c7f5e8b7d85afb9f2cceda069ba212de63052123aa
|
3 |
+
size 1004469416
|
checkpoint-71/optimizer_0/__10_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec98c4330115322acd50987209d2255f0e6faf7a178e844367bbe31282986b2a
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__11_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27b1c34d0a6b6c4660dba9ab5a5ed8efed5dd7051e3033cd893b9a04971dde84
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__12_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7619afac97039abcd17e59a74773fabe38fdef20954a98d00af294420e5c2a5a
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__13_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:603eee538d85aceb9012de4c9c2a2d1836d95e1d05767b2f373c981e3f1a871c
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__14_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:908ec24e148aa120e255599f666061aa00046eb8d6a4f17adb22195d5d9fbf2e
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__15_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0442bcb7c394360107abd08add7aa7dab0a2b57a6ab350f001132996b4bd3045
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__16_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c87a403ba95856910c39a9c98c910d00187611392a287ee46a02e3bc9324fe4
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__17_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7223d78deacc58c93cec8a1f081d7afe2e7b7e9b3c7a65285222375e7d68e3b
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__18_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c1275bc9ad19f5f587fff8f93d9b25f914d7de5231dbd93a374922ffb6c2381
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__19_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2116388a557a68f97a78ea1fa18266f473d4286c9d59f4afb56153c600c04dad
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__1_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad242006b33e0307ccbb9d1f76e163517e6be79a734ec02569e62f6bcc4bb690
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__20_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0c44e59a58a2675bd697b763f349cc6762fd2b97b3cbe9d6018b6f4a00ef947
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__21_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9081ac24f52d114eb82b6279e675f60472efa96c186253085fa7ca13c655673
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__22_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97b99215abb812eb2d5a65c3279acefa3f8ad99223ef53bd05c783bb2bec624e
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__23_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a62ed26cfb5a9f94a0f774f6671935762a467f72cba37e54b18af5ef38bf2d5
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__24_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:050b7939615da96106772afc82a2cd9567028ae93932563b5321bafe18cbe1fa
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__25_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aec6361ee1502f89430f1ffddd3abb5b7383fd37933ab90e01b361ef2835b9c
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__26_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:600f232035946120ac1390f57021a34f17bea2d5dfd805d9a4e83a3964ec6995
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__27_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd883db282faed4c2b4cc7658afb59d68d60d1d2c0a6b91aa1ea47638414b91a
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__28_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9098c47787db85588e8ec5368a55329482d739eff6681a7fc50b575ef8e58ed4
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__29_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa671264a735d0e8bcfed175b877cfc31e9f789e7f53f319c71908e0768f43e7
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__2_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0ee2fadd77b89fba0684dcfd30a88cc7a567af8a64f97368ede8964d2af3fb6
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__30_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a042ab745adbc8330594cd861d6020e2c40bc8a45742926263425a4c329173f
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__31_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49ed97969b385229ca5dba05fc00a8e1a8bb715bafde0aefc9adde7ea6f78600
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__32_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff73360edc4f49e98c9c1ee8b2adcb3d1e4e9a03349912484d6765058cb17f7e
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__33_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa8ad1a4d67e0f243cf0eddb302dd524e66027ed3ad05e6f25adca2f7de28f2d
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__34_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3cb88e4f2e27a4e228786f3d91f7a660a51feb3def2d001c0bf2db519b7732c
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__35_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9eafdba6d23a43d868da37bfb3c5b9de2140ceb46e9c4ecfafb6529841dbe56
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__36_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2817bb28216be7795ceff9d86092df0deff15ed54a78332d7c2425255c3cab48
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__37_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf362a32f842c01c36ffb2a999d9ab26554bd8afef72ad0a3b7c464c5df760e8
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__38_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63def0f1361594d2192d24c0eeabb1959ad022413c0cb0e37673f303d903f6e7
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__39_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30be6d7cacb28ef8f695cdd7eb98d778d4762de1999291da73920cd4e065f265
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__3_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:948002b45c957d1b19a2a9416c67f9b10d5bfd32af440486f8b970560cf9a5d2
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__40_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb12ad38a29bdabcbadd4a33ece7f0191c40c9af33e840b4f18c3eef6d5f431f
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__41_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd777702ce109ff00d2f0830586c00a3e64eb78b88441f50329e8854e26929f3
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__42_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63df45d6a488d04e261c75ada2c7f5c4d4151d1f716890f8d6af3d254dbc6297
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__43_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb4f9daaff7e3b0d8fe85d6acfac683808c879669c394568b6ef6024582dfd4f
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__44_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ed8d095dd9ca0d577e596fa5b82e203914a77cf5325084ce50bb6af08fac65
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__45_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be2ffc9df0516a623f0701d35540e40d7984a09256e13cc773f68e78a755b06d
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__46_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:767f4bab783673cb96ab4373f6ada658e0d10cd58bc84f6219b0e18537251e16
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__47_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea8b772a1fdb14eb190b915d6602c1ebc66c3cc2187b64423bd4048ee2312a95
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__48_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1515228871e89e286700857a9123d5c1f3bf732f227847c67ea802f8766ff90
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__49_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd133e09b4e511ea9d4b229b446a8fc1725d30953caedb6f12f42e96449c07ed
|
3 |
+
size 1004475000
|
checkpoint-71/optimizer_0/__4_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10fda3d3a2d843c1d5098d2ee1d25d2a6daf8ddaafdec9d7aa16d02157aff752
|
3 |
+
size 1004475316
|
checkpoint-71/optimizer_0/__50_0.distcp
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d03cab7298b118ce7b75a57aed37085bba683771317a6a758f318634536945d
|
3 |
+
size 1004475000
|