Automatic Speech Recognition
PEFT
TensorBoard
Safetensors
Generated from Trainer
lowhipa-large-comb / ft_config.json
jshrdt's picture
Upload folder using huggingface_hub
af0588a verified
{
"modelname": "openai/whisper-large-v2",
"gen_args": {"num_beams": 3},
"fallback": [7,5,1],
"corpora": {
"train": {
"asc": {
"languages": "ara",
"limit": [
1000
]
},
"multipa": {
"languages": [
"ja",
"pl",
"mt",
"hu",
"fi",
"el",
"ta"
],
"limit": [
1000,
1000,
1000,
1000,
1000,
1000,
1000
]
},
"thchs": {
"languages": "cmn",
"limit": [
1000
]
}
},
"dev": {
"asc": {
"languages": "ara",
"limit": [
50
]
},
"multipa": {
"languages": [
"ja",
"pl",
"mt",
"hu",
"fi",
"el",
"ta"
],
"limit": [
50,
50,
50,
50,
50,
50,
50
]
},
"thchs": {
"languages": "cmn",
"limit": [
50
]
}
}
},
"hyperparams": {
"output_dir": "../models/lowhipa-large-comb",
"overwrite_output_dir": "True",
"peft": "True",
"per_device_train_batch_size": 64,
"gradient_accumulation_steps": 1,
"learning_rate": 0.001,
"warmup_ratio": 0.1,
"max_steps": 1410,
"gradient_checkpointing": "True",
"fp16": "True",
"eval_strategy": "steps",
"per_device_eval_batch_size": 8,
"predict_with_generate": "True",
"generation_max_length": 225,
"save_steps": 282,
"eval_steps": 282,
"logging_steps": 282,
"logging_first_step": "True",
"report_to": [
"tensorboard"
],
"load_best_model_at_end": "False",
"metric_for_best_model": "pfer",
"greater_is_better": "False",
"hub_private_repo": "True",
"push_to_hub": "False",
"torch_empty_cache_steps": 4
}
}