martinctl committed on
Commit
76a5839
·
verified ·
1 Parent(s): c89ae93

Add training configuration

Browse files
Files changed (1) hide show
  1. training_config.json +19 -0
training_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "timestamp": "2025-05-26T17:27:49.001547",
3
+ "model_name": "Qwen/Qwen3-0.6B-Base",
4
+ "data_path": "data/mcqa_training_format.tsv",
5
+ "use_context": false,
6
+ "eval_with_context": false,
7
+ "epochs": 5,
8
+ "batch_size": 2,
9
+ "learning_rate": 5e-05,
10
+ "test_size": 0.1,
11
+ "max_samples": null,
12
+ "output_dir": "./qwen-mcqa-ft",
13
+ "baseline_only": false,
14
+ "eval_only": false,
15
+ "quantize_only": false,
16
+ "quantization": "8bit",
17
+ "device": "cuda",
18
+ "torch_version": "2.5.1+cu124"
19
+ }