mouseyy committed on
Commit
49f8dbc
·
verified ·
1 Parent(s): 4461cc2

Training in progress, step 1000

Browse files
Files changed (3) hide show
  1. config.json +7 -7
  2. model.safetensors +1 -1
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "_name_or_path": "mouseyy/result_data-1",
3
- "activation_dropout": 0.07393755234042465,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
6
  "adapter_stride": 2,
@@ -9,7 +9,7 @@
9
  "architectures": [
10
  "Wav2Vec2ForCTC"
11
  ],
12
- "attention_dropout": 0.02799881189017002,
13
  "bos_token_id": 1,
14
  "classifier_proj_size": 256,
15
  "codevector_dim": 768,
@@ -50,23 +50,23 @@
50
  "feat_extract_activation": "gelu",
51
  "feat_extract_dropout": 0.0,
52
  "feat_extract_norm": "layer",
53
- "feat_proj_dropout": 0.06639458235849151,
54
  "feat_quantizer_dropout": 0.0,
55
  "final_dropout": 0.0,
56
  "gradient_checkpointing": false,
57
  "hidden_act": "gelu",
58
- "hidden_dropout": 0.010817510288940036,
59
  "hidden_size": 1024,
60
  "initializer_range": 0.02,
61
  "intermediate_size": 4096,
62
  "layer_norm_eps": 1e-05,
63
- "layerdrop": 0.07393755234042465,
64
  "mask_feature_length": 10,
65
  "mask_feature_min_masks": 0,
66
- "mask_feature_prob": 0.02863724192728596,
67
  "mask_time_length": 10,
68
  "mask_time_min_masks": 2,
69
- "mask_time_prob": 0.02863724192728596,
70
  "model_type": "wav2vec2",
71
  "num_adapter_layers": 3,
72
  "num_attention_heads": 16,
 
1
  {
2
  "_name_or_path": "mouseyy/result_data-1",
3
+ "activation_dropout": 0.015195612302688774,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
6
  "adapter_stride": 2,
 
9
  "architectures": [
10
  "Wav2Vec2ForCTC"
11
  ],
12
+ "attention_dropout": 0.04564076009672891,
13
  "bos_token_id": 1,
14
  "classifier_proj_size": 256,
15
  "codevector_dim": 768,
 
50
  "feat_extract_activation": "gelu",
51
  "feat_extract_dropout": 0.0,
52
  "feat_extract_norm": "layer",
53
+ "feat_proj_dropout": 0.022155837435835574,
54
  "feat_quantizer_dropout": 0.0,
55
  "final_dropout": 0.0,
56
  "gradient_checkpointing": false,
57
  "hidden_act": "gelu",
58
+ "hidden_dropout": 0.03972759892699478,
59
  "hidden_size": 1024,
60
  "initializer_range": 0.02,
61
  "intermediate_size": 4096,
62
  "layer_norm_eps": 1e-05,
63
+ "layerdrop": 0.015195612302688774,
64
  "mask_feature_length": 10,
65
  "mask_feature_min_masks": 0,
66
+ "mask_feature_prob": 0.03627889583101227,
67
  "mask_time_length": 10,
68
  "mask_time_min_masks": 2,
69
+ "mask_time_prob": 0.03627889583101227,
70
  "model_type": "wav2vec2",
71
  "num_adapter_layers": 3,
72
  "num_attention_heads": 16,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aafc1f758008a10721c82d641bc622a590fc70bcf9733fa32b992b03721694af
3
  size 1261971480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce869097e9d40ff51f879c3acf794a39f926eaa9359732e42a2a77a280c92efa
3
  size 1261971480
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c63b5179af3b259aa6290032ad269ee22e7160967970313d8fec41c05bde415f
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:853893324eb07344fdec49bd69f27d31740bbdb6f6022ac3513a1741e7fe8b2a
3
  size 5432