Priyanship committed on
Commit
e84ee48
·
verified ·
1 Parent(s): a9470fa

End of training

Browse files
README.md ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - generated_from_trainer
4
+ model-index:
5
+ - name: pd_warmup250
6
+ results: []
7
+ ---
8
+
9
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
10
+ should probably proofread and complete it, then remove this comment. -->
11
+
12
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="200" height="32"/>](https://wandb.ai/priyanshipal/huggingface/runs/18ql5rrq)
13
+ # pd_warmup250
14
+
15
+ This model was trained from scratch on an unknown dataset.
16
+ It achieves the following results on the evaluation set:
17
+ - eval_loss: 21.9274
18
+ - eval_model_preparation_time: 0.0061
19
+ - eval_cer: 2.6007
20
+ - eval_wer: 1.0
21
+ - eval_runtime: 183.4843
22
+ - eval_samples_per_second: 17.091
23
+ - eval_steps_per_second: 1.068
24
+ - step: 0
25
+
26
+ ## Model description
27
+
28
+ More information needed
29
+
30
+ ## Intended uses & limitations
31
+
32
+ More information needed
33
+
34
+ ## Training and evaluation data
35
+
36
+ More information needed
37
+
38
+ ## Training procedure
39
+
40
+ ### Training hyperparameters
41
+
42
+ The following hyperparameters were used during training:
43
+ - learning_rate: 0.0006
44
+ - train_batch_size: 16
45
+ - eval_batch_size: 16
46
+ - seed: 400
47
+ - gradient_accumulation_steps: 2
48
+ - total_train_batch_size: 32
49
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
50
+ - lr_scheduler_type: linear
51
+ - lr_scheduler_warmup_steps: 250
52
+ - num_epochs: 30.0
53
+ - mixed_precision_training: Native AMP
54
+
55
+ ### Framework versions
56
+
57
+ - Transformers 4.43.1
58
+ - Pytorch 2.4.0
59
+ - Datasets 2.20.0
60
+ - Tokenizers 0.19.1
all_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_cer": 2.600693686104438,
3
+ "eval_loss": 21.927419662475586,
4
+ "eval_model_preparation_time": 0.0061,
5
+ "eval_runtime": 183.4843,
6
+ "eval_samples": 3136,
7
+ "eval_samples_per_second": 17.091,
8
+ "eval_steps_per_second": 1.068,
9
+ "eval_wer": 1.0
10
+ }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/m/triton/scratch/elec/puhe/p/palp3/MUCS/indicwav2vec-hindi",
3
  "activation_dropout": 0.0,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
 
1
  {
2
+ "_name_or_path": "/m/triton/scratch/elec/puhe/p/palp3/MUCS/indicwav2vec_outputs/pd_warmup250",
3
  "activation_dropout": 0.0,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
eval_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_cer": 2.600693686104438,
3
+ "eval_loss": 21.927419662475586,
4
+ "eval_model_preparation_time": 0.0061,
5
+ "eval_runtime": 183.4843,
6
+ "eval_samples": 3136,
7
+ "eval_samples_per_second": 17.091,
8
+ "eval_steps_per_second": 1.068,
9
+ "eval_wer": 1.0
10
+ }
json/default-e1fa1bd3a5ee0c77/0.0.0/7483f22a71512872c377524b97484f6d20c275799bb9e7cd8fb3198178d8220a.incomplete_info.lock ADDED
File without changes
json/default-e1fa1bd3a5ee0c77/0.0.0/7483f22a71512872c377524b97484f6d20c275799bb9e7cd8fb3198178d8220a/dataset_info.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"description": "", "citation": "", "homepage": "", "license": "", "features": {"audio_id": {"dtype": "string", "_type": "Value"}, "audio_paths": {"dtype": "string", "_type": "Value"}, "transcriptions": {"dtype": "string", "_type": "Value"}}, "builder_name": "json", "dataset_name": "json", "config_name": "default", "version": {"version_str": "0.0.0", "major": 0, "minor": 0, "patch": 0}, "splits": {"train": {"name": "train", "num_bytes": 791200, "num_examples": 3136, "dataset_name": "json"}}, "download_checksums": {"/m/triton/scratch/elec/puhe/p/palp3/MUCS/MUCS_train_test_dataset_dict_v2.json": {"num_bytes": 22505219, "checksum": null}}, "download_size": 22505219, "dataset_size": 791200, "size_in_bytes": 23296419}
json/default-e1fa1bd3a5ee0c77/0.0.0/7483f22a71512872c377524b97484f6d20c275799bb9e7cd8fb3198178d8220a/json-train.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbbe02a419ea87c50b03d02089a41e7a6c114e96411394405f3ca717ade2db7d
3
+ size 793032
json/default-e1fa1bd3a5ee0c77/0.0.0/7483f22a71512872c377524b97484f6d20c275799bb9e7cd8fb3198178d8220a_builder.lock ADDED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d6e542b15e77cd1bb8a7693945d939d7b6324a0178a2a54a151c7870a9a3a70
3
  size 1262426580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a3485fafffc5ac46d9c3a04ab47a90b39e1d7d8f31fbf95f3f6474a38b1a61
3
  size 1262426580
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f36285e2633cf53bd969b772d161600517cc1ebe36cfcc307477b6d106ff33c
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd53656a9df562387448fa18aacfe26d6d6bb71426ced564d4ddc09cd4d2ed04
3
  size 5368