pere committed on
Commit
e8127c4
·
1 Parent(s): adc1547

trying first training

Browse files
Files changed (1) hide show
  1. run_large_training.sh +6 -5
run_large_training.sh CHANGED
@@ -1,13 +1,13 @@
1
  #!/usr/bin/env bash
2
  accelerate launch run_distillation.py \
3
- --model_name_or_path "./previous-36500-epoch1-wer-15-250" \
4
  --teacher_model_name_or_path "NbAiLab/nb-whisper-large" \
5
  --train_dataset_name "NbAiLab/annotated_distil_raw_ncc_speech_v7_large" \
6
  --train_dataset_config_name "" \
7
  --train_split_name "train" \
8
- --eval_dataset_name "NbAiLab/annotated_distil_raw_ncc_speech_v7_large" \
9
  --eval_dataset_config_name "" \
10
- --eval_split_name "validation" \
11
  --eval_steps 500 \
12
  --save_steps 1000 \
13
  --warmup_steps 1000 \
@@ -19,7 +19,7 @@ accelerate launch run_distillation.py \
19
  --task "transcribe" \
20
  --logging_steps 200 \
21
  --save_total_limit 1 \
22
- --max_steps 10000 \
23
  --wer_threshold 5 \
24
  --per_device_train_batch_size 32 \
25
  --per_device_eval_batch_size 32 \
@@ -38,6 +38,7 @@ accelerate launch run_distillation.py \
38
  --freeze_embed_positions \
39
  --streaming True \
40
  --wandb_project "nb-distil-whisper-large-pytorch" \
41
- --wandb_name "pytorch2_lr3e4_wer5" \
 
42
  --push_to_hub
43
 
 
1
  #!/usr/bin/env bash
2
  accelerate launch run_distillation.py \
3
+ --model_name_or_path "./nb-distil-large-init" \
4
  --teacher_model_name_or_path "NbAiLab/nb-whisper-large" \
5
  --train_dataset_name "NbAiLab/annotated_distil_raw_ncc_speech_v7_large" \
6
  --train_dataset_config_name "" \
7
  --train_split_name "train" \
8
+ --eval_dataset_name "NbAiLab/ncc_speech_v7" \
9
  --eval_dataset_config_name "" \
10
+ --eval_split_name "validation_norwegian_fleurs" \
11
  --eval_steps 500 \
12
  --save_steps 1000 \
13
  --warmup_steps 1000 \
 
19
  --task "transcribe" \
20
  --logging_steps 200 \
21
  --save_total_limit 1 \
22
+ --max_steps 100000 \
23
  --wer_threshold 5 \
24
  --per_device_train_batch_size 32 \
25
  --per_device_eval_batch_size 32 \
 
38
  --freeze_embed_positions \
39
  --streaming True \
40
  --wandb_project "nb-distil-whisper-large-pytorch" \
41
+ --wandb_name "pytorch_lr3e4_wer10" \
42
+ --hub_model_id "NbAiLab/nb-distil-whisper-large-pytorch-wer10" \
43
  --push_to_hub
44