yangzhao02 committed on
Commit
3003d30
·
verified ·
1 Parent(s): db0216c

End of training

Browse files
Files changed (4) hide show
  1. README.md +11 -5
  2. all_results.json +10 -0
  3. config.json +1 -1
  4. eval_results.json +13 -0
README.md CHANGED
@@ -3,9 +3,15 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: Qwen/Qwen2.5-7B-Instruct-1M
5
  tags:
 
 
 
 
6
  - trl
7
  - ndcg
8
  - generated_from_trainer
 
 
9
  model-index:
10
  - name: qwen2.5-7b-lipo
11
  results: []
@@ -16,14 +22,14 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # qwen2.5-7b-lipo
18
 
19
- This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct-1M](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-1M) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.0017
22
- - Logps: -662.0203
23
- - Logits: -0.6116
24
- - Rank Correct Batch: 16.5244
25
  - Rank Pair Batch: 28.0
26
- - Rank Accuracy Batch: 0.5902
27
 
28
  ## Model description
29
 
 
3
  license: apache-2.0
4
  base_model: Qwen/Qwen2.5-7B-Instruct-1M
5
  tags:
6
+ - alignment-handbook
7
+ - ndcg
8
+ - trl
9
+ - generated_from_trainer
10
  - trl
11
  - ndcg
12
  - generated_from_trainer
13
+ datasets:
14
+ - yangzhao02/ListUltraFeedback
15
  model-index:
16
  - name: qwen2.5-7b-lipo
17
  results: []
 
22
 
23
  # qwen2.5-7b-lipo
24
 
25
+ This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct-1M](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-1M) on the yangzhao02/ListUltraFeedback dataset.
26
  It achieves the following results on the evaluation set:
27
  - Loss: 0.0017
28
+ - Logps: -661.8630
29
+ - Logits: -0.6117
30
+ - Rank Correct Batch: 16.5203
31
  - Rank Pair Batch: 28.0
32
+ - Rank Accuracy Batch: 0.5900
33
 
34
  ## Model description
35
 
all_results.json CHANGED
@@ -1,5 +1,15 @@
1
  {
2
  "epoch": 0.9982631930527722,
 
 
 
 
 
 
 
 
 
 
3
  "total_flos": 0.0,
4
  "train_loss": 0.0024812357072425285,
5
  "train_runtime": 43392.086,
 
1
  {
2
  "epoch": 0.9982631930527722,
3
+ "eval_logits": -0.6117165684700012,
4
+ "eval_logps": -661.8629760742188,
5
+ "eval_loss": 0.001710074720904231,
6
+ "eval_rank_accuracy_batch": 0.5900115966796875,
7
+ "eval_rank_correct_batch": 16.52032470703125,
8
+ "eval_rank_pair_batch": 28.0,
9
+ "eval_runtime": 601.0399,
10
+ "eval_samples": 1968,
11
+ "eval_samples_per_second": 3.274,
12
+ "eval_steps_per_second": 0.409,
13
  "total_flos": 0.0,
14
  "train_loss": 0.0024812357072425285,
15
  "train_runtime": 43392.086,
config.json CHANGED
@@ -28,7 +28,7 @@
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "bfloat16",
30
  "transformers_version": "4.45.1",
31
- "use_cache": false,
32
  "use_sliding_window": false,
33
  "vocab_size": 152064
34
  }
 
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "bfloat16",
30
  "transformers_version": "4.45.1",
31
+ "use_cache": true,
32
  "use_sliding_window": false,
33
  "vocab_size": 152064
34
  }
eval_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 0.9982631930527722,
3
+ "eval_logits": -0.6117165684700012,
4
+ "eval_logps": -661.8629760742188,
5
+ "eval_loss": 0.001710074720904231,
6
+ "eval_rank_accuracy_batch": 0.5900115966796875,
7
+ "eval_rank_correct_batch": 16.52032470703125,
8
+ "eval_rank_pair_batch": 28.0,
9
+ "eval_runtime": 601.0399,
10
+ "eval_samples": 1968,
11
+ "eval_samples_per_second": 3.274,
12
+ "eval_steps_per_second": 0.409
13
+ }