|
{ |
|
"experiment_summary": { |
|
"timestamp": "2025-05-26T20:36:55.416522", |
|
"model_name": "Qwen/Qwen3-0.6B-Base", |
|
"use_context_training": false, |
|
"use_context_evaluation": false, |
|
"quantization": "8bit", |
|
"quantize_only": false, |
|
"max_samples": null |
|
}, |
|
"results": { |
|
"baseline_accuracy": 0.6966019417475728, |
|
"fine_tuned_accuracy": 0.7067961165048544, |
|
"improvement": 0.010194174757281571, |
|
"improvement_percentage": "+1.02%" |
|
}, |
|
"training_config": { |
|
"timestamp": "2025-05-26T17:27:49.001547", |
|
"model_name": "Qwen/Qwen3-0.6B-Base", |
|
"data_path": "data/mcqa_training_format.tsv", |
|
"use_context": false, |
|
"eval_with_context": false, |
|
"epochs": 5, |
|
"batch_size": 2, |
|
"learning_rate": 5e-05, |
|
"test_size": 0.1, |
|
"max_samples": null, |
|
"output_dir": "./qwen-mcqa-ft", |
|
"baseline_only": false, |
|
"eval_only": false, |
|
"quantize_only": false, |
|
"quantization": "8bit", |
|
"device": "cuda", |
|
"torch_version": "2.5.1+cu124" |
|
}, |
|
"success": true |
|
} |