JayHyeon committed on
Commit
bf1cabf
·
verified ·
1 Parent(s): 70e0eb9

Training in progress, step 500

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. model.safetensors +2 -2
  3. training_args.bin +3 -0
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "_name_or_path": "/root/trl/results_v2/Qwen_0.5-DPO_5e-7-3ep_0alp_0lam/checkpoint-1000",
3
  "architectures": [
4
- "Qwen2Model"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
@@ -21,7 +21,7 @@
21
  "rope_theta": 1000000.0,
22
  "sliding_window": null,
23
  "tie_word_embeddings": true,
24
- "torch_dtype": "float32",
25
  "transformers_version": "4.47.0.dev0",
26
  "use_cache": false,
27
  "use_mrope": false,
 
1
  {
2
+ "_name_or_path": "JayHyeon/Qwen2.5-0.5B-SFT-2e-5-2ep",
3
  "architectures": [
4
+ "Qwen2ForCausalLM"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
 
21
  "rope_theta": 1000000.0,
22
  "sliding_window": null,
23
  "tie_word_embeddings": true,
24
+ "torch_dtype": "bfloat16",
25
  "transformers_version": "4.47.0.dev0",
26
  "use_cache": false,
27
  "use_mrope": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:170fac463719e3515dce45db7ea731a97c41964b2311307b47d067fd2e14f0a1
3
- size 1976161736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a755cb689f3c33c39520ae8c3ccd65ef610a2659b74c8108fcf377bbed2b811
3
+ size 1260367448
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a5320ca4174c5d1dd72c7330bd70fcfed9d7698b365441012342df3e75612c7
3
+ size 7736