{
  "modelname": "openai/whisper-large-v2",
  "gen_args": {"num_beams": 3},
  "fallback": [7,5,1],
  "corpora": {
    "train": {
      "asc": {
        "languages": "ara",
        "limit": [
          1000
        ]
      },
      "multipa": {
        "languages": [
          "ja",
          "pl",
          "mt",
          "hu",
          "fi",
          "el",
          "ta"
        ],
        "limit": [
          1000,
          1000,
          1000,
          1000,
          1000,
          1000,
          1000
        ]
      },
      "thchs": {
        "languages": "cmn",
        "limit": [
          1000
        ]
      }
    },
    "dev": {
      "asc": {
        "languages": "ara",
        "limit": [
          50
        ]
      },
      "multipa": {
        "languages": [
          "ja",
          "pl",
          "mt",
          "hu",
          "fi",
          "el",
          "ta"
        ],
        "limit": [
          50,
          50,
          50,
          50,
          50,
          50,
          50
        ]
      },
      "thchs": {
        "languages": "cmn",
        "limit": [
          50
        ]
      }
    }
  },
  "hyperparams": {
    "output_dir": "../models/lowhipa-large-comb",
    "overwrite_output_dir": "True",
    "peft": "True",
    "per_device_train_batch_size": 64,
    "gradient_accumulation_steps": 1,
    "learning_rate": 0.001,
    "warmup_ratio": 0.1,
    "max_steps": 1410,
    "gradient_checkpointing": "True",
    "fp16": "True",
    "eval_strategy": "steps",
    "per_device_eval_batch_size": 8,
    "predict_with_generate": "True",
    "generation_max_length": 225,
    "save_steps": 282,
    "eval_steps": 282,
    "logging_steps": 282,
    "logging_first_step": "True",
    "report_to": [
      "tensorboard"
    ],
    "load_best_model_at_end": "False",
    "metric_for_best_model": "pfer",
    "greater_is_better": "False",
    "hub_private_repo": "True",
    "push_to_hub": "False",
    "torch_empty_cache_steps": 4
  }
}