quablab committed on
Commit
0807ac1
·
verified ·
1 Parent(s): 8e867aa

Training in progress, step 250

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: smollm3-dpo-aligned
5
  tags:
6
  - generated_from_trainer
7
- - dpo
8
  - trl
 
9
  - hf_jobs
10
  licence: license
11
  ---
@@ -38,7 +38,7 @@ This model was trained with DPO, a method introduced in [Direct Preference Optim
38
  - TRL: 0.23.1
39
  - Transformers: 4.57.0
40
  - Pytorch: 2.8.0
41
- - Datasets: 4.1.1
42
  - Tokenizers: 0.22.1
43
 
44
  ## Citations
 
4
  model_name: smollm3-dpo-aligned
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - dpo
9
  - hf_jobs
10
  licence: license
11
  ---
 
38
  - TRL: 0.23.1
39
  - Transformers: 4.57.0
40
  - Pytorch: 2.8.0
41
+ - Datasets: 4.2.0
42
  - Tokenizers: 0.22.1
43
 
44
  ## Citations
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b180a72bff2c203fbfe0944193a818650fc787a46ca7cb7f4949cf666000d439
3
  size 4932711224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27ea17dcd3aa343959a976b1b6353187f5d56b83d93f59a542e981e0d9eadd48
3
  size 4932711224
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acfa0dbd9cfb935e72b3489652a99a7769e964c935fe9d217e455722d16f7822
3
  size 4999889128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d297a49ddf624fb29a13e4f9dd213d44ffd1a5e2d9d7812b3c29de5b84942d3c
3
  size 4999889128
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa7042b5dcd2c151b5be60ca7b7fdc34455c2d5bf0a5a5c00ece5f3fa0f66d32
3
  size 2367831672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65918e207cd42a56248e9f19f2adeb870af1d6438807da1a312306d4ea1083d2
3
  size 2367831672
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4ef81110d7b4d7111f6d4193557a68e977d32353a2667651a384114b4dd4563
3
  size 6865
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a070aab623ee5d67c053edef8d7c47ad27c728d8fe38fc3a0cd854a9efa218dc
3
  size 6865