openvino-ci committed on
Commit
748efc8
·
verified ·
1 Parent(s): 1ef483b

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -1,19 +1,126 @@
1
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  license: apache-2.0
3
  license_link: https://choosealicense.com/licenses/apache-2.0/
4
  ---
 
5
  # whisper-large-v3-fp16-ov
6
- * Model creator: [Openai](https://huggingface.co/openai)
7
  * Original model: [whisper-large-v3](https://huggingface.co/openai/whisper-large-v3)
8
 
9
  ## Description
 
10
 
11
  ## Compatibility
12
 
13
  The provided OpenVINO™ IR model is compatible with:
14
 
15
- * OpenVINO version 2024.5.0 and higher
16
- * Optimum Intel 1.21.0 and higher
17
 
18
 
19
  ## Running Model Inference with [Optimum Intel](https://huggingface.co/docs/optimum/intel/index)
@@ -27,6 +134,7 @@ pip install optimum[openvino]
27
  2. Run model inference:
28
 
29
  ```
 
30
  from transformers import AutoProcessor
31
  from optimum.intel.openvino import OVModelForSpeechSeq2Seq
32
 
@@ -37,14 +145,14 @@ model = OVModelForSpeechSeq2Seq.from_pretrained(model_id)
37
  dataset = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation", trust_remote_code=True)
38
  sample = dataset[0]
39
 
40
- input_features = processor(
41
  sample["audio"]["array"],
42
  sampling_rate=sample["audio"]["sampling_rate"],
43
  return_tensors="pt",
44
  ).input_features
45
 
46
  outputs = model.generate(input_features)
47
- text = processor.batch_decode(outputs)[0]
48
  print(text)
49
  ```
50
 
@@ -78,7 +186,7 @@ device = "CPU"
78
  pipe = ov_genai.WhisperPipeline(model_path, device)
79
 
80
  dataset = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation", trust_remote_code=True)
81
- sample = dataset[0]["audio]["array"]
82
  print(pipe.generate(sample))
83
  ```
84
 
 
1
  ---
2
+ language:
3
+ - en
4
+ - zh
5
+ - de
6
+ - es
7
+ - ru
8
+ - ko
9
+ - fr
10
+ - ja
11
+ - pt
12
+ - tr
13
+ - pl
14
+ - ca
15
+ - nl
16
+ - ar
17
+ - sv
18
+ - it
19
+ - id
20
+ - hi
21
+ - fi
22
+ - vi
23
+ - he
24
+ - uk
25
+ - el
26
+ - ms
27
+ - cs
28
+ - ro
29
+ - da
30
+ - hu
31
+ - ta
32
+ - no
33
+ - th
34
+ - ur
35
+ - hr
36
+ - bg
37
+ - lt
38
+ - la
39
+ - mi
40
+ - ml
41
+ - cy
42
+ - sk
43
+ - te
44
+ - fa
45
+ - lv
46
+ - bn
47
+ - sr
48
+ - az
49
+ - sl
50
+ - kn
51
+ - et
52
+ - mk
53
+ - br
54
+ - eu
55
+ - is
56
+ - hy
57
+ - ne
58
+ - mn
59
+ - bs
60
+ - kk
61
+ - sq
62
+ - sw
63
+ - gl
64
+ - mr
65
+ - pa
66
+ - si
67
+ - km
68
+ - sn
69
+ - yo
70
+ - so
71
+ - af
72
+ - oc
73
+ - ka
74
+ - be
75
+ - tg
76
+ - sd
77
+ - gu
78
+ - am
79
+ - yi
80
+ - lo
81
+ - uz
82
+ - fo
83
+ - ht
84
+ - ps
85
+ - tk
86
+ - nn
87
+ - mt
88
+ - sa
89
+ - lb
90
+ - my
91
+ - bo
92
+ - tl
93
+ - mg
94
+ - as
95
+ - tt
96
+ - haw
97
+ - ln
98
+ - ha
99
+ - ba
100
+ - jw
101
+ - su
102
+ tags:
103
+ - audio
104
+ - automatic-speech-recognition
105
+ - hf-asr-leaderboard
106
+ pipeline_tag: automatic-speech-recognition
107
  license: apache-2.0
108
  license_link: https://choosealicense.com/licenses/apache-2.0/
109
  ---
110
+
111
  # whisper-large-v3-fp16-ov
112
+ * Model creator: [OpenAI](https://huggingface.co/openai)
113
  * Original model: [whisper-large-v3](https://huggingface.co/openai/whisper-large-v3)
114
 
115
  ## Description
116
+ This is the [whisper-large-v3](https://huggingface.co/openai/whisper-large-v3) model converted to the [OpenVINO™ IR](https://docs.openvino.ai/2025/documentation/openvino-ir-format.html) (Intermediate Representation) format with weights compressed to FP16.
117
 
118
  ## Compatibility
119
 
120
  The provided OpenVINO™ IR model is compatible with:
121
 
122
+ * OpenVINO version 2025.1.0 and higher
123
+ * Optimum Intel 1.23.0 and higher
124
 
125
 
126
  ## Running Model Inference with [Optimum Intel](https://huggingface.co/docs/optimum/intel/index)
 
134
  2. Run model inference:
135
 
136
  ```
137
+ from datasets import load_dataset
138
  from transformers import AutoProcessor
139
  from optimum.intel.openvino import OVModelForSpeechSeq2Seq
140
 
 
145
  dataset = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation", trust_remote_code=True)
146
  sample = dataset[0]
147
 
148
+ input_features = tokenizer(
149
  sample["audio"]["array"],
150
  sampling_rate=sample["audio"]["sampling_rate"],
151
  return_tensors="pt",
152
  ).input_features
153
 
154
  outputs = model.generate(input_features)
155
+ text = tokenizer.batch_decode(outputs)[0]
156
  print(text)
157
  ```
158
 
 
186
  pipe = ov_genai.WhisperPipeline(model_path, device)
187
 
188
  dataset = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation", trust_remote_code=True)
189
+ sample = dataset[0]["audio"]["array"]
190
  print(pipe.generate(sample))
191
  ```
192
 
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
  "_attn_implementation_autoset": true,
3
- "_name_or_path": "OpenVINO/whisper-large-v3-fp16-ov",
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
6
  "apply_spec_augment": false,
@@ -40,7 +39,8 @@
40
  "num_mel_bins": 128,
41
  "pad_token_id": 50256,
42
  "scale_embedding": false,
43
- "transformers_version": "4.46.3",
 
44
  "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51866
 
1
  {
2
  "_attn_implementation_autoset": true,
 
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
39
  "num_mel_bins": 128,
40
  "pad_token_id": 50256,
41
  "scale_embedding": false,
42
+ "torch_dtype": "float32",
43
+ "transformers_version": "4.51.3",
44
  "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51866
generation_config.json CHANGED
@@ -261,5 +261,5 @@
261
  "transcribe": 50360,
262
  "translate": 50359
263
  },
264
- "transformers_version": "4.46.3"
265
  }
 
261
  "transcribe": 50360,
262
  "translate": 50359
263
  },
264
+ "transformers_version": "4.51.3"
265
  }
openvino_decoder_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41697c02b031489bad1553d7b60a2d2d4567a02e41c41345ff1e2407c3f51b6f
3
- size 1813043394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c1d1237bc1deb5263c6d1e20557ac3eec7d0f91d7204e9f3fb57ff3f042fd55
3
+ size 3626086568
openvino_decoder_model.xml CHANGED
The diff for this file is too large to render. See raw diff
 
openvino_detokenizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c95aa7a4b53ecb3768d2a6608aa9e419059aef1c75b9b99e6b1c56328281c18
3
- size 528306
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2b3c47825a1089525ff65c0c8e49271e1dee69a401a04fc827ac2de5b7766e4
3
+ size 736198
openvino_detokenizer.xml CHANGED
@@ -1,16 +1,16 @@
1
  <?xml version="1.0"?>
2
  <net name="detokenizer" version="11">
3
  <layers>
4
- <layer id="0" name="Parameter_126105" type="Parameter" version="opset1">
5
  <data shape="?,?" element_type="i64" />
6
  <output>
7
- <port id="0" precision="I64" names="Parameter_126105">
8
  <dim>-1</dim>
9
  <dim>-1</dim>
10
  </port>
11
  </output>
12
  </layer>
13
- <layer id="1" name="Convert_126121" type="Convert" version="opset1">
14
  <data destination_type="i32" />
15
  <input>
16
  <port id="0" precision="I64">
@@ -25,54 +25,59 @@
25
  </port>
26
  </output>
27
  </layer>
28
- <layer id="2" name="Constant_126066" type="Const" version="opset1">
29
- <data element_type="u8" shape="528257" offset="0" size="528257" />
30
  <output>
31
- <port id="0" precision="U8">
32
- <dim>528257</dim>
33
  </port>
34
  </output>
35
  </layer>
36
- <layer id="3" name="StringTensorUnpack_126067" type="StringTensorUnpack" version="extension">
37
- <data mode="begins_ends" />
38
- <input>
39
- <port id="0" precision="U8">
40
- <dim>528257</dim>
41
- </port>
42
- </input>
43
  <output>
44
- <port id="1" precision="I32">
45
- <dim>-1</dim>
46
  </port>
47
- <port id="2" precision="I32">
48
- <dim>-1</dim>
 
 
 
 
 
49
  </port>
50
- <port id="3" precision="U8">
51
- <dim>-1</dim>
 
 
 
 
 
52
  </port>
53
  </output>
54
  </layer>
55
- <layer id="4" name="VocabDecoder_126106" type="VocabDecoder" version="extension">
56
- <data skip_tokens="50257, 50258, 50259, 50260, 50261, 50262, 50263, 50264, 50265, 50266, 50267, 50268, 50269, 50270, 50271, 50272, 50273, 50274, 50275, 50276, 50277, 50278, 50279, 50280, 50281, 50282, 50283, 50284, 50285, 50286, 50287, 50288, 50289, 50290, 50291, 50292, 50293, 50294, 50295, 50296, 50297, 50298, 50299, 50300, 50301, 50302, 50303, 50304, 50305, 50306, 50307, 50308, 50309, 50310, 50311, 50312, 50313, 50314, 50315, 50316, 50317, 50318, 50319, 50320, 50321, 50322, 50323, 50324, 50325, 50326, 50327, 50328, 50329, 50330, 50331, 50332, 50333, 50334, 50335, 50336, 50337, 50338, 50339, 50340, 50341, 50342, 50343, 50344, 50345, 50346, 50347, 50348, 50349, 50350, 50351, 50352, 50353, 50354, 50355, 50356, 50357, 50358, 50359, 50360, 50361, 50362, 50363, 50364" />
57
  <input>
58
  <port id="0" precision="I32">
59
  <dim>-1</dim>
60
  <dim>-1</dim>
61
  </port>
62
  <port id="1" precision="I32">
63
- <dim>-1</dim>
64
  </port>
65
  <port id="2" precision="I32">
66
- <dim>-1</dim>
67
  </port>
68
  <port id="3" precision="U8">
69
- <dim>-1</dim>
70
  </port>
71
- </input>
72
- <output>
73
  <port id="4" precision="I32">
74
- <dim>-1</dim>
75
  </port>
 
 
76
  <port id="5" precision="I32">
77
  <dim>-1</dim>
78
  </port>
@@ -82,12 +87,15 @@
82
  <port id="7" precision="I32">
83
  <dim>-1</dim>
84
  </port>
85
- <port id="8" precision="U8">
 
 
 
86
  <dim>-1</dim>
87
  </port>
88
  </output>
89
  </layer>
90
- <layer id="5" name="FuzeRagged_126107" type="FuzeRagged" version="extension">
91
  <input>
92
  <port id="0" precision="I32">
93
  <dim>-1</dim>
@@ -111,23 +119,48 @@
111
  </port>
112
  </output>
113
  </layer>
114
- <layer id="6" name="Constant_126109" type="Const" version="opset1">
115
- <data element_type="u8" shape="47" offset="528257" size="47" />
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
116
  <output>
117
  <port id="0" precision="U8">
118
- <dim>47</dim>
119
  </port>
120
  </output>
121
  </layer>
122
- <layer id="7" name="Constant_126111" type="Const" version="opset1">
123
- <data element_type="u8" shape="2" offset="528304" size="2" />
124
  <output>
125
  <port id="0" precision="U8">
126
  <dim>2</dim>
127
  </port>
128
  </output>
129
  </layer>
130
- <layer id="8" name="RegexNormalization_126112" type="RegexNormalization" version="extension">
131
  <data global_replace="true" />
132
  <input>
133
  <port id="0" precision="I32">
@@ -140,7 +173,7 @@
140
  <dim>-1</dim>
141
  </port>
142
  <port id="3" precision="U8">
143
- <dim>47</dim>
144
  </port>
145
  <port id="4" precision="U8">
146
  <dim>2</dim>
@@ -158,8 +191,7 @@
158
  </port>
159
  </output>
160
  </layer>
161
- <layer id="9" name="StringTensorPack_126113" type="StringTensorPack" version="extension">
162
- <data mode="begins_ends" />
163
  <input>
164
  <port id="0" precision="I32">
165
  <dim>-1</dim>
@@ -172,12 +204,12 @@
172
  </port>
173
  </input>
174
  <output>
175
- <port id="3" precision="STRING" names="string_output">
176
  <dim>-1</dim>
177
  </port>
178
  </output>
179
  </layer>
180
- <layer id="10" name="Result_126114" type="Result" version="opset1">
181
  <input>
182
  <port id="0" precision="STRING">
183
  <dim>-1</dim>
@@ -187,24 +219,27 @@
187
  </layers>
188
  <edges>
189
  <edge from-layer="0" from-port="0" to-layer="1" to-port="0" />
190
- <edge from-layer="1" from-port="1" to-layer="4" to-port="0" />
191
- <edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
192
- <edge from-layer="3" from-port="1" to-layer="4" to-port="1" />
193
- <edge from-layer="3" from-port="2" to-layer="4" to-port="2" />
194
- <edge from-layer="3" from-port="3" to-layer="4" to-port="3" />
195
- <edge from-layer="4" from-port="7" to-layer="5" to-port="3" />
196
- <edge from-layer="4" from-port="8" to-layer="8" to-port="2" />
197
- <edge from-layer="4" from-port="6" to-layer="5" to-port="2" />
198
- <edge from-layer="4" from-port="5" to-layer="5" to-port="1" />
199
- <edge from-layer="4" from-port="4" to-layer="5" to-port="0" />
200
- <edge from-layer="5" from-port="4" to-layer="8" to-port="0" />
201
- <edge from-layer="5" from-port="5" to-layer="8" to-port="1" />
202
- <edge from-layer="6" from-port="0" to-layer="8" to-port="3" />
203
- <edge from-layer="7" from-port="0" to-layer="8" to-port="4" />
204
- <edge from-layer="8" from-port="5" to-layer="9" to-port="0" />
205
- <edge from-layer="8" from-port="6" to-layer="9" to-port="1" />
206
- <edge from-layer="8" from-port="7" to-layer="9" to-port="2" />
207
- <edge from-layer="9" from-port="3" to-layer="10" to-port="0" />
 
 
 
208
  </edges>
209
  <rt_info>
210
  <add_attention_mask value="True" />
@@ -215,21 +250,22 @@
215
  <detokenizer_input_type value="i64" />
216
  <eos_token_id value="50257" />
217
  <handle_special_tokens_with_re />
 
218
  <number_of_inputs value="1" />
219
- <openvino_tokenizers_version value="2024.5.0.0" />
220
- <openvino_version value="2024.5.0" />
 
221
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
222
  <pad_token_id value="50257" />
223
- <sentencepiece_version value="0.2.0" />
224
  <skip_special_tokens value="True" />
225
  <streaming_detokenizer value="False" />
226
- <tiktoken_version value="0.8.0" />
227
  <tokenizer_output_type value="i64" />
228
- <tokenizers_version value="0.20.3" />
229
- <transformers_version value="4.46.3" />
230
  <use_max_padding value="False" />
231
  <use_sentencepiece_backend value="False" />
232
- <utf8_replace_mode />
233
  <with_detokenizer value="True" />
234
  </rt_info>
235
  </net>
 
1
  <?xml version="1.0"?>
2
  <net name="detokenizer" version="11">
3
  <layers>
4
+ <layer id="0" name="Parameter_83360" type="Parameter" version="opset1">
5
  <data shape="?,?" element_type="i64" />
6
  <output>
7
+ <port id="0" precision="I64" names="Parameter_83360">
8
  <dim>-1</dim>
9
  <dim>-1</dim>
10
  </port>
11
  </output>
12
  </layer>
13
+ <layer id="1" name="Convert_83555" type="Convert" version="opset1">
14
  <data destination_type="i32" />
15
  <input>
16
  <port id="0" precision="I64">
 
25
  </port>
26
  </output>
27
  </layer>
28
+ <layer id="2" name="Constant_83362" type="Const" version="opset1">
29
+ <data element_type="i32" shape="51866" offset="0" size="207464" />
30
  <output>
31
+ <port id="0" precision="I32">
32
+ <dim>51866</dim>
33
  </port>
34
  </output>
35
  </layer>
36
+ <layer id="3" name="Constant_83364" type="Const" version="opset1">
37
+ <data element_type="i32" shape="51866" offset="207464" size="207464" />
 
 
 
 
 
38
  <output>
39
+ <port id="0" precision="I32">
40
+ <dim>51866</dim>
41
  </port>
42
+ </output>
43
+ </layer>
44
+ <layer id="4" name="Constant_83366" type="Const" version="opset1">
45
+ <data element_type="u8" shape="320785" offset="414928" size="320785" />
46
+ <output>
47
+ <port id="0" precision="U8">
48
+ <dim>320785</dim>
49
  </port>
50
+ </output>
51
+ </layer>
52
+ <layer id="5" name="Slice_83371" type="Const" version="opset1">
53
+ <data element_type="i32" shape="108" offset="735713" size="432" />
54
+ <output>
55
+ <port id="0" precision="I32">
56
+ <dim>108</dim>
57
  </port>
58
  </output>
59
  </layer>
60
+ <layer id="6" name="VocabDecoder_83373" type="VocabDecoder" version="extension">
61
+ <data skip_tokens="" />
62
  <input>
63
  <port id="0" precision="I32">
64
  <dim>-1</dim>
65
  <dim>-1</dim>
66
  </port>
67
  <port id="1" precision="I32">
68
+ <dim>51866</dim>
69
  </port>
70
  <port id="2" precision="I32">
71
+ <dim>51866</dim>
72
  </port>
73
  <port id="3" precision="U8">
74
+ <dim>320785</dim>
75
  </port>
 
 
76
  <port id="4" precision="I32">
77
+ <dim>108</dim>
78
  </port>
79
+ </input>
80
+ <output>
81
  <port id="5" precision="I32">
82
  <dim>-1</dim>
83
  </port>
 
87
  <port id="7" precision="I32">
88
  <dim>-1</dim>
89
  </port>
90
+ <port id="8" precision="I32">
91
+ <dim>-1</dim>
92
+ </port>
93
+ <port id="9" precision="U8">
94
  <dim>-1</dim>
95
  </port>
96
  </output>
97
  </layer>
98
+ <layer id="7" name="FuzeRagged_83374" type="FuzeRagged" version="extension">
99
  <input>
100
  <port id="0" precision="I32">
101
  <dim>-1</dim>
 
119
  </port>
120
  </output>
121
  </layer>
122
+ <layer id="8" name="UTF8Validate_83375" type="UTF8Validate" version="extension">
123
+ <data replace_mode="true" />
124
+ <input>
125
+ <port id="0" precision="I32">
126
+ <dim>-1</dim>
127
+ </port>
128
+ <port id="1" precision="I32">
129
+ <dim>-1</dim>
130
+ </port>
131
+ <port id="2" precision="U8">
132
+ <dim>-1</dim>
133
+ </port>
134
+ </input>
135
+ <output>
136
+ <port id="3" precision="I32">
137
+ <dim>-1</dim>
138
+ </port>
139
+ <port id="4" precision="I32">
140
+ <dim>-1</dim>
141
+ </port>
142
+ <port id="5" precision="U8">
143
+ <dim>-1</dim>
144
+ </port>
145
+ </output>
146
+ </layer>
147
+ <layer id="9" name="Constant_83377" type="Const" version="opset1">
148
+ <data element_type="u8" shape="51" offset="736145" size="51" />
149
  <output>
150
  <port id="0" precision="U8">
151
+ <dim>51</dim>
152
  </port>
153
  </output>
154
  </layer>
155
+ <layer id="10" name="Constant_83379" type="Const" version="opset1">
156
+ <data element_type="u8" shape="2" offset="736196" size="2" />
157
  <output>
158
  <port id="0" precision="U8">
159
  <dim>2</dim>
160
  </port>
161
  </output>
162
  </layer>
163
+ <layer id="11" name="RegexNormalization_83380" type="RegexNormalization" version="extension">
164
  <data global_replace="true" />
165
  <input>
166
  <port id="0" precision="I32">
 
173
  <dim>-1</dim>
174
  </port>
175
  <port id="3" precision="U8">
176
+ <dim>51</dim>
177
  </port>
178
  <port id="4" precision="U8">
179
  <dim>2</dim>
 
191
  </port>
192
  </output>
193
  </layer>
194
+ <layer id="12" name="StringTensorPack_83381" type="StringTensorPack" version="opset15">
 
195
  <input>
196
  <port id="0" precision="I32">
197
  <dim>-1</dim>
 
204
  </port>
205
  </input>
206
  <output>
207
+ <port id="3" precision="STRING" names="Result_83382,string_output">
208
  <dim>-1</dim>
209
  </port>
210
  </output>
211
  </layer>
212
+ <layer id="13" name="Result_83382" type="Result" version="opset1" output_names="Result_83382,string_output">
213
  <input>
214
  <port id="0" precision="STRING">
215
  <dim>-1</dim>
 
219
  </layers>
220
  <edges>
221
  <edge from-layer="0" from-port="0" to-layer="1" to-port="0" />
222
+ <edge from-layer="1" from-port="1" to-layer="6" to-port="0" />
223
+ <edge from-layer="2" from-port="0" to-layer="6" to-port="1" />
224
+ <edge from-layer="3" from-port="0" to-layer="6" to-port="2" />
225
+ <edge from-layer="4" from-port="0" to-layer="6" to-port="3" />
226
+ <edge from-layer="5" from-port="0" to-layer="6" to-port="4" />
227
+ <edge from-layer="6" from-port="5" to-layer="7" to-port="0" />
228
+ <edge from-layer="6" from-port="6" to-layer="7" to-port="1" />
229
+ <edge from-layer="6" from-port="7" to-layer="7" to-port="2" />
230
+ <edge from-layer="6" from-port="8" to-layer="7" to-port="3" />
231
+ <edge from-layer="6" from-port="9" to-layer="8" to-port="2" />
232
+ <edge from-layer="7" from-port="5" to-layer="8" to-port="1" />
233
+ <edge from-layer="7" from-port="4" to-layer="8" to-port="0" />
234
+ <edge from-layer="8" from-port="3" to-layer="11" to-port="0" />
235
+ <edge from-layer="8" from-port="4" to-layer="11" to-port="1" />
236
+ <edge from-layer="8" from-port="5" to-layer="11" to-port="2" />
237
+ <edge from-layer="9" from-port="0" to-layer="11" to-port="3" />
238
+ <edge from-layer="10" from-port="0" to-layer="11" to-port="4" />
239
+ <edge from-layer="11" from-port="5" to-layer="12" to-port="0" />
240
+ <edge from-layer="11" from-port="6" to-layer="12" to-port="1" />
241
+ <edge from-layer="11" from-port="7" to-layer="12" to-port="2" />
242
+ <edge from-layer="12" from-port="3" to-layer="13" to-port="0" />
243
  </edges>
244
  <rt_info>
245
  <add_attention_mask value="True" />
 
250
  <detokenizer_input_type value="i64" />
251
  <eos_token_id value="50257" />
252
  <handle_special_tokens_with_re />
253
+ <max_length />
254
  <number_of_inputs value="1" />
255
+ <openvino_tokenizers_version value="2025.2.0.0-565-130827ab189" />
256
+ <openvino_version value="2025.2.0-19120-87425bc78ca-releases/2025/2" />
257
+ <original_post_processor_template value="{&quot;type&quot;: &quot;TemplateProcessing&quot;, &quot;single&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|startoftranscript|>&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|notimestamps|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|endoftext|>&quot;, &quot;type_id&quot;: 0}}], &quot;pair&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|startoftranscript|>&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|notimestamps|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;B&quot;, &quot;type_id&quot;: 1}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|endoftext|>&quot;, &quot;type_id&quot;: 1}}], &quot;special_tokens&quot;: {&quot;&lt;|endoftext|>&quot;: {&quot;id&quot;: &quot;&lt;|endoftext|>&quot;, &quot;ids&quot;: [50257], &quot;tokens&quot;: [&quot;&lt;|endoftext|>&quot;]}, &quot;&lt;|notimestamps|>&quot;: {&quot;id&quot;: &quot;&lt;|notimestamps|>&quot;, &quot;ids&quot;: [50364], &quot;tokens&quot;: [&quot;&lt;|notimestamps|>&quot;]}, &quot;&lt;|startoftranscript|>&quot;: {&quot;id&quot;: &quot;&lt;|startoftranscript|>&quot;, &quot;ids&quot;: [50258], &quot;tokens&quot;: [&quot;&lt;|startoftranscript|>&quot;]}}}" />
258
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
259
  <pad_token_id value="50257" />
260
+ <processed_post_processor_template value="{&quot;single&quot;: {&quot;ids&quot;: [50258, 50364, -1, 50257], &quot;type_ids&quot;: [0, 0, 0, 0]}, &quot;pair&quot;: {&quot;ids&quot;: [50258, 50364, -1, -2, 50257], &quot;type_ids&quot;: [0, 0, 0, 1, 1]}}" />
261
  <skip_special_tokens value="True" />
262
  <streaming_detokenizer value="False" />
 
263
  <tokenizer_output_type value="i64" />
264
+ <tokenizers_version value="0.21.1" />
265
+ <transformers_version value="4.51.3" />
266
  <use_max_padding value="False" />
267
  <use_sentencepiece_backend value="False" />
268
+ <utf8_replace_mode value="replace" />
269
  <with_detokenizer value="True" />
270
  </rt_info>
271
  </net>
openvino_encoder_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:087e741d86bd118bc021c9c61c1e809e865181540faa78fa8dabe00013f2db18
3
- size 1273938020
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9da520da461f014b5df3b64fd8bc25f9ceea83ad47d4f1d07698afe4332dbf7e
3
+ size 2547875940
openvino_encoder_model.xml CHANGED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbf72e07d6505915459aae6060bc1e7caba6e8e3be2bae0b2aeb5fd94a00edd1
3
- size 1288293
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b39f55ee479e6dfcd0a2896d0ff386940cdc5dee3fd3ce16e893b2098d32b16
3
+ size 1902189
openvino_tokenizer.xml CHANGED
@@ -1,27 +1,27 @@
1
  <?xml version="1.0"?>
2
  <net name="tokenizer" version="11">
3
  <layers>
4
- <layer id="0" name="Parameter_125985" type="Parameter" version="opset1">
5
  <data shape="?" element_type="string" />
6
  <output>
7
- <port id="0" precision="STRING" names="Parameter_125985">
8
  <dim>-1</dim>
9
  </port>
10
  </output>
11
  </layer>
12
- <layer id="1" name="Constant_126083" type="Const" version="opset1">
13
  <data element_type="i32" shape="" offset="0" size="4" />
14
  <output>
15
  <port id="0" precision="I32" />
16
  </output>
17
  </layer>
18
- <layer id="2" name="Constant_126084" type="Const" version="opset1">
19
  <data element_type="i32" shape="" offset="4" size="4" />
20
  <output>
21
  <port id="0" precision="I32" />
22
  </output>
23
  </layer>
24
- <layer id="3" name="Constant_126085" type="Const" version="opset1">
25
  <data element_type="i32" shape="1" offset="8" size="4" />
26
  <output>
27
  <port id="0" precision="I32">
@@ -29,19 +29,19 @@
29
  </port>
30
  </output>
31
  </layer>
32
- <layer id="4" name="Constant_126086" type="Const" version="opset1">
33
  <data element_type="i32" shape="" offset="0" size="4" />
34
  <output>
35
  <port id="0" precision="I32" />
36
  </output>
37
  </layer>
38
- <layer id="5" name="Constant_126087" type="Const" version="opset1">
39
  <data element_type="i32" shape="" offset="4" size="4" />
40
  <output>
41
  <port id="0" precision="I32" />
42
  </output>
43
  </layer>
44
- <layer id="6" name="Constant_126088" type="Const" version="opset1">
45
  <data element_type="i32" shape="1" offset="12" size="4" />
46
  <output>
47
  <port id="0" precision="I32">
@@ -49,14 +49,13 @@
49
  </port>
50
  </output>
51
  </layer>
52
- <layer id="7" name="Constant_125991" type="Const" version="opset1">
53
  <data element_type="i64" shape="" offset="16" size="8" />
54
  <output>
55
  <port id="0" precision="I64" />
56
  </output>
57
  </layer>
58
- <layer id="8" name="StringTensorUnpack_125986" type="StringTensorUnpack" version="extension">
59
- <data mode="begins_ends" />
60
  <input>
61
  <port id="0" precision="STRING">
62
  <dim>-1</dim>
@@ -74,7 +73,7 @@
74
  </port>
75
  </output>
76
  </layer>
77
- <layer id="9" name="ShapeOf_125987" type="ShapeOf" version="opset3">
78
  <data output_type="i64" />
79
  <input>
80
  <port id="0" precision="I32">
@@ -87,19 +86,19 @@
87
  </port>
88
  </output>
89
  </layer>
90
- <layer id="10" name="Constant_125988" type="Const" version="opset1">
91
  <data element_type="i64" shape="" offset="16" size="8" />
92
  <output>
93
  <port id="0" precision="I64" />
94
  </output>
95
  </layer>
96
- <layer id="11" name="Constant_125989" type="Const" version="opset1">
97
  <data element_type="i64" shape="" offset="16" size="8" />
98
  <output>
99
  <port id="0" precision="I64" />
100
  </output>
101
  </layer>
102
- <layer id="12" name="Gather_125990" type="Gather" version="opset8">
103
  <data batch_dims="0" />
104
  <input>
105
  <port id="0" precision="I64">
@@ -112,13 +111,13 @@
112
  <port id="3" precision="I64" />
113
  </output>
114
  </layer>
115
- <layer id="13" name="Constant_125992" type="Const" version="opset1">
116
  <data element_type="i64" shape="" offset="24" size="8" />
117
  <output>
118
  <port id="0" precision="I64" />
119
  </output>
120
  </layer>
121
- <layer id="14" name="Range_125993" type="Range" version="opset4">
122
  <data output_type="i32" />
123
  <input>
124
  <port id="0" precision="I64" />
@@ -131,19 +130,19 @@
131
  </port>
132
  </output>
133
  </layer>
134
- <layer id="15" name="Constant_125994" type="Const" version="opset1">
135
  <data element_type="i64" shape="" offset="24" size="8" />
136
  <output>
137
  <port id="0" precision="I64" />
138
  </output>
139
  </layer>
140
- <layer id="16" name="Constant_125995" type="Const" version="opset1">
141
  <data element_type="i64" shape="" offset="24" size="8" />
142
  <output>
143
  <port id="0" precision="I64" />
144
  </output>
145
  </layer>
146
- <layer id="17" name="Add_125996" type="Add" version="opset1">
147
  <data auto_broadcast="numpy" />
148
  <input>
149
  <port id="0" precision="I64" />
@@ -153,13 +152,13 @@
153
  <port id="2" precision="I64" />
154
  </output>
155
  </layer>
156
- <layer id="18" name="Constant_125997" type="Const" version="opset1">
157
  <data element_type="i64" shape="" offset="24" size="8" />
158
  <output>
159
  <port id="0" precision="I64" />
160
  </output>
161
  </layer>
162
- <layer id="19" name="Range_125998" type="Range" version="opset4">
163
  <data output_type="i32" />
164
  <input>
165
  <port id="0" precision="I64" />
@@ -172,7 +171,7 @@
172
  </port>
173
  </output>
174
  </layer>
175
- <layer id="20" name="Constant_126060" type="Const" version="opset1">
176
  <data element_type="u8" shape="26491" offset="32" size="26491" />
177
  <output>
178
  <port id="0" precision="U8">
@@ -180,7 +179,7 @@
180
  </port>
181
  </output>
182
  </layer>
183
- <layer id="21" name="SpecialTokensSplit_126061" type="SpecialTokensSplit" version="extension">
184
  <input>
185
  <port id="0" precision="I32">
186
  <dim>-1</dim>
@@ -222,15 +221,15 @@
222
  </port>
223
  </output>
224
  </layer>
225
- <layer id="22" name="Constant_126063" type="Const" version="opset1">
226
- <data element_type="u8" shape="64" offset="26523" size="64" />
227
  <output>
228
  <port id="0" precision="U8">
229
- <dim>64</dim>
230
  </port>
231
  </output>
232
  </layer>
233
- <layer id="23" name="RegexSplit_126064" type="RegexSplit" version="extension">
234
  <data behaviour="isolate" invert="false" max_splits="-1" />
235
  <input>
236
  <port id="0" precision="I32">
@@ -252,7 +251,7 @@
252
  <dim>-1</dim>
253
  </port>
254
  <port id="6" precision="U8">
255
- <dim>64</dim>
256
  </port>
257
  </input>
258
  <output>
@@ -276,123 +275,111 @@
276
  </port>
277
  </output>
278
  </layer>
279
- <layer id="24" name="Constant_126066" type="Const" version="opset1">
280
- <data element_type="u8" shape="528257" offset="26587" size="528257" />
281
  <output>
282
- <port id="0" precision="U8">
283
- <dim>528257</dim>
284
  </port>
285
  </output>
286
  </layer>
287
- <layer id="25" name="StringTensorUnpack_126067" type="StringTensorUnpack" version="extension">
288
- <data mode="begins_ends" />
289
- <input>
290
- <port id="0" precision="U8">
291
- <dim>528257</dim>
292
- </port>
293
- </input>
294
  <output>
295
- <port id="1" precision="I32">
296
- <dim>-1</dim>
297
- </port>
298
- <port id="2" precision="I32">
299
- <dim>-1</dim>
300
- </port>
301
- <port id="3" precision="U8">
302
- <dim>-1</dim>
303
  </port>
304
  </output>
305
  </layer>
306
- <layer id="26" name="Constant_126072" type="Const" version="opset1">
307
- <data element_type="u8" shape="369958" offset="554844" size="369958" />
308
  <output>
309
  <port id="0" precision="U8">
310
- <dim>369958</dim>
311
  </port>
312
  </output>
313
  </layer>
314
- <layer id="27" name="StringTensorUnpack_126073" type="StringTensorUnpack" version="extension">
315
- <data mode="begins_ends" />
316
- <input>
317
- <port id="0" precision="U8">
318
- <dim>369958</dim>
319
- </port>
320
- </input>
321
  <output>
322
- <port id="1" precision="I32">
323
- <dim>-1</dim>
324
- </port>
325
- <port id="2" precision="I32">
326
- <dim>-1</dim>
327
- </port>
328
- <port id="3" precision="U8">
329
- <dim>-1</dim>
330
  </port>
331
  </output>
332
  </layer>
333
- <layer id="28" name="Constant_126075" type="Const" version="opset1">
334
- <data element_type="u8" shape="336859" offset="924802" size="336859" />
335
  <output>
336
- <port id="0" precision="U8">
337
- <dim>336859</dim>
338
  </port>
339
  </output>
340
  </layer>
341
- <layer id="29" name="StringTensorUnpack_126076" type="StringTensorUnpack" version="extension">
342
- <data mode="begins_ends" />
343
- <input>
344
  <port id="0" precision="U8">
345
- <dim>336859</dim>
346
  </port>
347
- </input>
 
 
 
348
  <output>
349
- <port id="1" precision="I32">
350
- <dim>-1</dim>
351
- </port>
352
- <port id="2" precision="I32">
353
- <dim>-1</dim>
354
- </port>
355
- <port id="3" precision="U8">
356
- <dim>-1</dim>
357
  </port>
358
  </output>
359
  </layer>
360
- <layer id="30" name="Constant_126069" type="Const" version="opset1">
361
- <data element_type="u8" shape="20172" offset="1261661" size="20172" />
362
  <output>
363
- <port id="0" precision="U8">
364
- <dim>20172</dim>
365
  </port>
366
  </output>
367
  </layer>
368
- <layer id="31" name="StringTensorUnpack_126070" type="StringTensorUnpack" version="extension">
369
- <data mode="begins_ends" />
370
- <input>
371
  <port id="0" precision="U8">
372
- <dim>20172</dim>
373
  </port>
374
- </input>
 
 
 
375
  <output>
376
- <port id="1" precision="I32">
377
- <dim>-1</dim>
378
  </port>
379
- <port id="2" precision="I32">
380
- <dim>-1</dim>
 
 
 
 
 
381
  </port>
382
- <port id="3" precision="U8">
383
- <dim>-1</dim>
 
 
 
 
 
384
  </port>
385
  </output>
386
  </layer>
387
- <layer id="32" name="Constant_126077" type="Const" version="opset1">
388
- <data element_type="i32" shape="1609" offset="1281833" size="6436" />
389
  <output>
390
  <port id="0" precision="I32">
391
  <dim>1609</dim>
392
  </port>
393
  </output>
394
  </layer>
395
- <layer id="33" name="BPETokenizer_126078" type="BPETokenizer" version="extension">
396
  <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
397
  <input>
398
  <port id="0" precision="I32">
@@ -411,40 +398,40 @@
411
  <dim>-1</dim>
412
  </port>
413
  <port id="5" precision="I32">
414
- <dim>-1</dim>
415
  </port>
416
  <port id="6" precision="I32">
417
- <dim>-1</dim>
418
  </port>
419
  <port id="7" precision="U8">
420
- <dim>-1</dim>
421
  </port>
422
  <port id="8" precision="I32">
423
- <dim>-1</dim>
424
  </port>
425
  <port id="9" precision="I32">
426
- <dim>-1</dim>
427
  </port>
428
  <port id="10" precision="U8">
429
- <dim>-1</dim>
430
  </port>
431
  <port id="11" precision="I32">
432
- <dim>-1</dim>
433
  </port>
434
  <port id="12" precision="I32">
435
- <dim>-1</dim>
436
  </port>
437
  <port id="13" precision="U8">
438
- <dim>-1</dim>
439
  </port>
440
  <port id="14" precision="I32">
441
- <dim>-1</dim>
442
  </port>
443
  <port id="15" precision="I32">
444
- <dim>-1</dim>
445
  </port>
446
  <port id="16" precision="U8">
447
- <dim>-1</dim>
448
  </port>
449
  <port id="17" precision="I32">
450
  <dim>1609</dim>
@@ -462,44 +449,30 @@
462
  </port>
463
  </output>
464
  </layer>
465
- <layer id="34" name="Subtract_126079" type="Subtract" version="opset1">
466
- <data auto_broadcast="numpy" />
467
- <input>
468
- <port id="0" precision="I32">
469
- <dim>-1</dim>
470
- </port>
471
- <port id="1" precision="I32">
472
- <dim>-1</dim>
473
- </port>
474
- </input>
475
  <output>
476
- <port id="2" precision="I32">
477
- <dim>-1</dim>
478
- </port>
479
  </output>
480
  </layer>
481
- <layer id="35" name="Constant_126080" type="Const" version="opset1">
482
- <data element_type="i32" shape="" offset="1288269" size="4" />
483
  <output>
484
- <port id="0" precision="I32" />
 
 
485
  </output>
486
  </layer>
487
- <layer id="36" name="Minimum_126081" type="Minimum" version="opset1">
488
- <data auto_broadcast="numpy" />
489
- <input>
490
- <port id="0" precision="I32">
491
- <dim>-1</dim>
492
- </port>
493
- <port id="1" precision="I32" />
494
- </input>
495
  <output>
496
- <port id="2" precision="I32">
497
- <dim>-1</dim>
498
  </port>
499
  </output>
500
  </layer>
501
- <layer id="37" name="Add_126082" type="Add" version="opset1">
502
- <data auto_broadcast="numpy" />
503
  <input>
504
  <port id="0" precision="I32">
505
  <dim>-1</dim>
@@ -507,42 +480,58 @@
507
  <port id="1" precision="I32">
508
  <dim>-1</dim>
509
  </port>
 
 
 
 
 
 
 
 
 
 
510
  </input>
511
  <output>
512
- <port id="2" precision="I32">
 
 
 
 
 
 
513
  <dim>-1</dim>
514
  </port>
515
  </output>
516
  </layer>
517
- <layer id="38" name="Constant_126089" type="Const" version="opset1">
518
  <data element_type="i32" shape="" offset="0" size="4" />
519
  <output>
520
  <port id="0" precision="I32" />
521
  </output>
522
  </layer>
523
- <layer id="39" name="Constant_126090" type="Const" version="opset1">
524
  <data element_type="i32" shape="" offset="4" size="4" />
525
  <output>
526
  <port id="0" precision="I32" />
527
  </output>
528
  </layer>
529
- <layer id="40" name="Constant_126091" type="Const" version="opset1">
530
- <data element_type="i32" shape="1" offset="1288273" size="4" />
531
  <output>
532
  <port id="0" precision="I32">
533
  <dim>1</dim>
534
  </port>
535
  </output>
536
  </layer>
537
- <layer id="41" name="Constant_126092" type="Const" version="opset1">
538
- <data element_type="i32" shape="4" offset="1288277" size="16" />
539
  <output>
540
  <port id="0" precision="I32">
541
  <dim>4</dim>
542
  </port>
543
  </output>
544
  </layer>
545
- <layer id="42" name="CombineSegments_126093" type="CombineSegments" version="extension">
546
  <input>
547
  <port id="0" precision="I32" />
548
  <port id="1" precision="I32" />
@@ -593,7 +582,7 @@
593
  </port>
594
  </output>
595
  </layer>
596
- <layer id="43" name="Subtract_126094" type="Subtract" version="opset1">
597
  <data auto_broadcast="numpy" />
598
  <input>
599
  <port id="0" precision="I32">
@@ -609,13 +598,13 @@
609
  </port>
610
  </output>
611
  </layer>
612
- <layer id="44" name="Constant_126095" type="Const" version="opset1">
613
  <data element_type="i32" shape="" offset="0" size="4" />
614
  <output>
615
  <port id="0" precision="I32" />
616
  </output>
617
  </layer>
618
- <layer id="45" name="ReduceMax_126096" type="ReduceMax" version="opset1">
619
  <data keep_dims="false" />
620
  <input>
621
  <port id="0" precision="I32">
@@ -627,14 +616,14 @@
627
  <port id="2" precision="I32" />
628
  </output>
629
  </layer>
630
- <layer id="46" name="Constant_126097" type="Const" version="opset1">
631
- <data element_type="i32" shape="" offset="1288273" size="4" />
632
  <output>
633
  <port id="0" precision="I32" />
634
  </output>
635
  </layer>
636
- <layer id="47" name="RaggedToDense_126098" type="RaggedToDense" version="extension">
637
- <data pad_right="true" />
638
  <input>
639
  <port id="0" precision="I32">
640
  <dim>-1</dim>
@@ -659,7 +648,7 @@
659
  </port>
660
  </output>
661
  </layer>
662
- <layer id="48" name="Convert_126099" type="Convert" version="opset1">
663
  <data destination_type="i32" />
664
  <input>
665
  <port id="0" precision="BOOL">
@@ -674,7 +663,7 @@
674
  </port>
675
  </output>
676
  </layer>
677
- <layer id="49" name="Convert_126099" type="Convert" version="opset1">
678
  <data destination_type="i64" />
679
  <input>
680
  <port id="0" precision="I32">
@@ -689,7 +678,7 @@
689
  </port>
690
  </output>
691
  </layer>
692
- <layer id="51" name="RaggedToDense_126098.0" type="Convert" version="opset1">
693
  <data destination_type="i64" />
694
  <input>
695
  <port id="0" precision="I32">
@@ -704,7 +693,7 @@
704
  </port>
705
  </output>
706
  </layer>
707
- <layer id="52" name="Result_126102" type="Result" version="opset1">
708
  <input>
709
  <port id="0" precision="I64">
710
  <dim>-1</dim>
@@ -712,7 +701,7 @@
712
  </port>
713
  </input>
714
  </layer>
715
- <layer id="50" name="Result_126104" type="Result" version="opset1">
716
  <input>
717
  <port id="0" precision="I64">
718
  <dim>-1</dim>
@@ -723,12 +712,12 @@
723
  </layers>
724
  <edges>
725
  <edge from-layer="0" from-port="0" to-layer="8" to-port="0" />
726
- <edge from-layer="1" from-port="0" to-layer="42" to-port="0" />
727
- <edge from-layer="2" from-port="0" to-layer="42" to-port="1" />
728
- <edge from-layer="3" from-port="0" to-layer="42" to-port="2" />
729
- <edge from-layer="4" from-port="0" to-layer="42" to-port="3" />
730
- <edge from-layer="5" from-port="0" to-layer="42" to-port="4" />
731
- <edge from-layer="6" from-port="0" to-layer="42" to-port="5" />
732
  <edge from-layer="7" from-port="0" to-layer="14" to-port="0" />
733
  <edge from-layer="8" from-port="1" to-layer="9" to-port="0" />
734
  <edge from-layer="8" from-port="3" to-layer="21" to-port="4" />
@@ -737,8 +726,8 @@
737
  <edge from-layer="9" from-port="1" to-layer="12" to-port="0" />
738
  <edge from-layer="10" from-port="0" to-layer="12" to-port="1" />
739
  <edge from-layer="11" from-port="0" to-layer="12" to-port="2" />
740
- <edge from-layer="12" from-port="3" to-layer="14" to-port="1" />
741
  <edge from-layer="12" from-port="3" to-layer="17" to-port="0" />
 
742
  <edge from-layer="13" from-port="0" to-layer="14" to-port="2" />
743
  <edge from-layer="14" from-port="3" to-layer="21" to-port="0" />
744
  <edge from-layer="15" from-port="0" to-layer="19" to-port="0" />
@@ -747,62 +736,58 @@
747
  <edge from-layer="18" from-port="0" to-layer="19" to-port="2" />
748
  <edge from-layer="19" from-port="3" to-layer="21" to-port="1" />
749
  <edge from-layer="20" from-port="0" to-layer="21" to-port="5" />
 
750
  <edge from-layer="21" from-port="7" to-layer="23" to-port="1" />
751
  <edge from-layer="21" from-port="8" to-layer="23" to-port="2" />
752
  <edge from-layer="21" from-port="9" to-layer="23" to-port="3" />
753
  <edge from-layer="21" from-port="10" to-layer="23" to-port="4" />
754
  <edge from-layer="21" from-port="11" to-layer="23" to-port="5" />
755
- <edge from-layer="21" from-port="6" to-layer="23" to-port="0" />
756
  <edge from-layer="22" from-port="0" to-layer="23" to-port="6" />
757
- <edge from-layer="23" from-port="7" to-layer="33" to-port="0" />
758
- <edge from-layer="23" from-port="11" to-layer="33" to-port="4" />
759
- <edge from-layer="23" from-port="10" to-layer="33" to-port="3" />
760
- <edge from-layer="23" from-port="9" to-layer="33" to-port="2" />
761
- <edge from-layer="23" from-port="8" to-layer="33" to-port="1" />
762
- <edge from-layer="24" from-port="0" to-layer="25" to-port="0" />
763
- <edge from-layer="25" from-port="1" to-layer="33" to-port="5" />
764
- <edge from-layer="25" from-port="2" to-layer="33" to-port="6" />
765
- <edge from-layer="25" from-port="3" to-layer="33" to-port="7" />
766
- <edge from-layer="26" from-port="0" to-layer="27" to-port="0" />
767
- <edge from-layer="27" from-port="3" to-layer="33" to-port="10" />
768
- <edge from-layer="27" from-port="1" to-layer="33" to-port="8" />
769
- <edge from-layer="27" from-port="2" to-layer="33" to-port="9" />
770
- <edge from-layer="28" from-port="0" to-layer="29" to-port="0" />
771
- <edge from-layer="29" from-port="3" to-layer="33" to-port="13" />
772
- <edge from-layer="29" from-port="2" to-layer="33" to-port="12" />
773
- <edge from-layer="29" from-port="1" to-layer="33" to-port="11" />
774
- <edge from-layer="30" from-port="0" to-layer="31" to-port="0" />
775
- <edge from-layer="31" from-port="1" to-layer="33" to-port="14" />
776
- <edge from-layer="31" from-port="2" to-layer="33" to-port="15" />
777
- <edge from-layer="31" from-port="3" to-layer="33" to-port="16" />
778
- <edge from-layer="32" from-port="0" to-layer="33" to-port="17" />
779
- <edge from-layer="33" from-port="20" to-layer="42" to-port="8" />
780
- <edge from-layer="33" from-port="18" to-layer="42" to-port="6" />
781
- <edge from-layer="33" from-port="18" to-layer="37" to-port="0" />
782
- <edge from-layer="33" from-port="18" to-layer="34" to-port="1" />
783
- <edge from-layer="33" from-port="19" to-layer="34" to-port="0" />
784
- <edge from-layer="34" from-port="2" to-layer="36" to-port="0" />
785
- <edge from-layer="35" from-port="0" to-layer="36" to-port="1" />
786
- <edge from-layer="36" from-port="2" to-layer="37" to-port="1" />
787
- <edge from-layer="37" from-port="2" to-layer="42" to-port="7" />
788
- <edge from-layer="38" from-port="0" to-layer="42" to-port="9" />
789
- <edge from-layer="39" from-port="0" to-layer="42" to-port="10" />
790
- <edge from-layer="40" from-port="0" to-layer="42" to-port="11" />
791
- <edge from-layer="41" from-port="0" to-layer="42" to-port="12" />
792
- <edge from-layer="42" from-port="13" to-layer="43" to-port="1" />
793
- <edge from-layer="42" from-port="15" to-layer="47" to-port="2" />
794
- <edge from-layer="42" from-port="14" to-layer="47" to-port="1" />
795
- <edge from-layer="42" from-port="13" to-layer="47" to-port="0" />
796
- <edge from-layer="42" from-port="14" to-layer="43" to-port="0" />
797
- <edge from-layer="43" from-port="2" to-layer="45" to-port="0" />
798
- <edge from-layer="44" from-port="0" to-layer="45" to-port="1" />
799
- <edge from-layer="45" from-port="2" to-layer="47" to-port="3" />
800
- <edge from-layer="46" from-port="0" to-layer="47" to-port="4" />
801
- <edge from-layer="47" from-port="6" to-layer="48" to-port="0" />
802
- <edge from-layer="47" from-port="5" to-layer="51" to-port="0" />
803
- <edge from-layer="48" from-port="1" to-layer="49" to-port="0" />
804
- <edge from-layer="49" from-port="1" to-layer="50" to-port="0" />
805
- <edge from-layer="51" from-port="1" to-layer="52" to-port="0" />
806
  </edges>
807
  <rt_info>
808
  <add_attention_mask value="True" />
@@ -813,21 +798,22 @@
813
  <detokenizer_input_type value="i64" />
814
  <eos_token_id value="50257" />
815
  <handle_special_tokens_with_re />
 
816
  <number_of_inputs value="1" />
817
- <openvino_tokenizers_version value="2024.5.0.0" />
818
- <openvino_version value="2024.5.0" />
 
819
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
820
  <pad_token_id value="50257" />
821
- <sentencepiece_version value="0.2.0" />
822
  <skip_special_tokens value="True" />
823
  <streaming_detokenizer value="False" />
824
- <tiktoken_version value="0.8.0" />
825
  <tokenizer_output_type value="i64" />
826
- <tokenizers_version value="0.20.3" />
827
- <transformers_version value="4.46.3" />
828
  <use_max_padding value="False" />
829
  <use_sentencepiece_backend value="False" />
830
- <utf8_replace_mode />
831
  <with_detokenizer value="True" />
832
  </rt_info>
833
  </net>
 
1
  <?xml version="1.0"?>
2
  <net name="tokenizer" version="11">
3
  <layers>
4
+ <layer id="0" name="Parameter_83226" type="Parameter" version="opset1">
5
  <data shape="?" element_type="string" />
6
  <output>
7
+ <port id="0" precision="STRING" names="Parameter_83226">
8
  <dim>-1</dim>
9
  </port>
10
  </output>
11
  </layer>
12
+ <layer id="1" name="Constant_83338" type="Const" version="opset1">
13
  <data element_type="i32" shape="" offset="0" size="4" />
14
  <output>
15
  <port id="0" precision="I32" />
16
  </output>
17
  </layer>
18
+ <layer id="2" name="Constant_83339" type="Const" version="opset1">
19
  <data element_type="i32" shape="" offset="4" size="4" />
20
  <output>
21
  <port id="0" precision="I32" />
22
  </output>
23
  </layer>
24
+ <layer id="3" name="Constant_83340" type="Const" version="opset1">
25
  <data element_type="i32" shape="1" offset="8" size="4" />
26
  <output>
27
  <port id="0" precision="I32">
 
29
  </port>
30
  </output>
31
  </layer>
32
+ <layer id="4" name="Constant_83341" type="Const" version="opset1">
33
  <data element_type="i32" shape="" offset="0" size="4" />
34
  <output>
35
  <port id="0" precision="I32" />
36
  </output>
37
  </layer>
38
+ <layer id="5" name="Constant_83342" type="Const" version="opset1">
39
  <data element_type="i32" shape="" offset="4" size="4" />
40
  <output>
41
  <port id="0" precision="I32" />
42
  </output>
43
  </layer>
44
+ <layer id="6" name="Constant_83343" type="Const" version="opset1">
45
  <data element_type="i32" shape="1" offset="12" size="4" />
46
  <output>
47
  <port id="0" precision="I32">
 
49
  </port>
50
  </output>
51
  </layer>
52
+ <layer id="7" name="Constant_83232" type="Const" version="opset1">
53
  <data element_type="i64" shape="" offset="16" size="8" />
54
  <output>
55
  <port id="0" precision="I64" />
56
  </output>
57
  </layer>
58
+ <layer id="8" name="StringTensorUnpack_83227" type="StringTensorUnpack" version="opset15">
 
59
  <input>
60
  <port id="0" precision="STRING">
61
  <dim>-1</dim>
 
73
  </port>
74
  </output>
75
  </layer>
76
+ <layer id="9" name="ShapeOf_83228" type="ShapeOf" version="opset3">
77
  <data output_type="i64" />
78
  <input>
79
  <port id="0" precision="I32">
 
86
  </port>
87
  </output>
88
  </layer>
89
+ <layer id="10" name="Constant_83229" type="Const" version="opset1">
90
  <data element_type="i64" shape="" offset="16" size="8" />
91
  <output>
92
  <port id="0" precision="I64" />
93
  </output>
94
  </layer>
95
+ <layer id="11" name="Constant_83230" type="Const" version="opset1">
96
  <data element_type="i64" shape="" offset="16" size="8" />
97
  <output>
98
  <port id="0" precision="I64" />
99
  </output>
100
  </layer>
101
+ <layer id="12" name="Gather_83231" type="Gather" version="opset8">
102
  <data batch_dims="0" />
103
  <input>
104
  <port id="0" precision="I64">
 
111
  <port id="3" precision="I64" />
112
  </output>
113
  </layer>
114
+ <layer id="13" name="Constant_83233" type="Const" version="opset1">
115
  <data element_type="i64" shape="" offset="24" size="8" />
116
  <output>
117
  <port id="0" precision="I64" />
118
  </output>
119
  </layer>
120
+ <layer id="14" name="Range_83234" type="Range" version="opset4">
121
  <data output_type="i32" />
122
  <input>
123
  <port id="0" precision="I64" />
 
130
  </port>
131
  </output>
132
  </layer>
133
+ <layer id="15" name="Constant_83235" type="Const" version="opset1">
134
  <data element_type="i64" shape="" offset="24" size="8" />
135
  <output>
136
  <port id="0" precision="I64" />
137
  </output>
138
  </layer>
139
+ <layer id="16" name="Constant_83236" type="Const" version="opset1">
140
  <data element_type="i64" shape="" offset="24" size="8" />
141
  <output>
142
  <port id="0" precision="I64" />
143
  </output>
144
  </layer>
145
+ <layer id="17" name="Add_83237" type="Add" version="opset1">
146
  <data auto_broadcast="numpy" />
147
  <input>
148
  <port id="0" precision="I64" />
 
152
  <port id="2" precision="I64" />
153
  </output>
154
  </layer>
155
+ <layer id="18" name="Constant_83238" type="Const" version="opset1">
156
  <data element_type="i64" shape="" offset="24" size="8" />
157
  <output>
158
  <port id="0" precision="I64" />
159
  </output>
160
  </layer>
161
+ <layer id="19" name="Range_83239" type="Range" version="opset4">
162
  <data output_type="i32" />
163
  <input>
164
  <port id="0" precision="I64" />
 
171
  </port>
172
  </output>
173
  </layer>
174
+ <layer id="20" name="Constant_83301" type="Const" version="opset1">
175
  <data element_type="u8" shape="26491" offset="32" size="26491" />
176
  <output>
177
  <port id="0" precision="U8">
 
179
  </port>
180
  </output>
181
  </layer>
182
+ <layer id="21" name="SpecialTokensSplit_83302" type="SpecialTokensSplit" version="extension">
183
  <input>
184
  <port id="0" precision="I32">
185
  <dim>-1</dim>
 
221
  </port>
222
  </output>
223
  </layer>
224
+ <layer id="22" name="Constant_83304" type="Const" version="opset1">
225
+ <data element_type="u8" shape="74" offset="26523" size="74" />
226
  <output>
227
  <port id="0" precision="U8">
228
+ <dim>74</dim>
229
  </port>
230
  </output>
231
  </layer>
232
+ <layer id="23" name="RegexSplit_83305" type="RegexSplit" version="extension">
233
  <data behaviour="isolate" invert="false" max_splits="-1" />
234
  <input>
235
  <port id="0" precision="I32">
 
251
  <dim>-1</dim>
252
  </port>
253
  <port id="6" precision="U8">
254
+ <dim>74</dim>
255
  </port>
256
  </input>
257
  <output>
 
275
  </port>
276
  </output>
277
  </layer>
278
+ <layer id="24" name="Constant_83307" type="Const" version="opset1">
279
+ <data element_type="i32" shape="51866" offset="26597" size="207464" />
280
  <output>
281
+ <port id="0" precision="I32">
282
+ <dim>51866</dim>
283
  </port>
284
  </output>
285
  </layer>
286
+ <layer id="25" name="Constant_83309" type="Const" version="opset1">
287
+ <data element_type="i32" shape="51866" offset="234061" size="207464" />
 
 
 
 
 
288
  <output>
289
+ <port id="0" precision="I32">
290
+ <dim>51866</dim>
 
 
 
 
 
 
291
  </port>
292
  </output>
293
  </layer>
294
+ <layer id="26" name="Constant_83311" type="Const" version="opset1">
295
+ <data element_type="u8" shape="320785" offset="441525" size="320785" />
296
  <output>
297
  <port id="0" precision="U8">
298
+ <dim>320785</dim>
299
  </port>
300
  </output>
301
  </layer>
302
+ <layer id="27" name="Constant_83319" type="Const" version="opset1">
303
+ <data element_type="i32" shape="50000" offset="762310" size="200000" />
 
 
 
 
 
304
  <output>
305
+ <port id="0" precision="I32">
306
+ <dim>50000</dim>
 
 
 
 
 
 
307
  </port>
308
  </output>
309
  </layer>
310
+ <layer id="28" name="Constant_83321" type="Const" version="opset1">
311
+ <data element_type="i32" shape="50000" offset="962310" size="200000" />
312
  <output>
313
+ <port id="0" precision="I32">
314
+ <dim>50000</dim>
315
  </port>
316
  </output>
317
  </layer>
318
+ <layer id="29" name="Constant_83323" type="Const" version="opset1">
319
+ <data element_type="u8" shape="169950" offset="1162310" size="169950" />
320
+ <output>
321
  <port id="0" precision="U8">
322
+ <dim>169950</dim>
323
  </port>
324
+ </output>
325
+ </layer>
326
+ <layer id="30" name="Constant_83325" type="Const" version="opset1">
327
+ <data element_type="i32" shape="50000" offset="1332260" size="200000" />
328
  <output>
329
+ <port id="0" precision="I32">
330
+ <dim>50000</dim>
 
 
 
 
 
 
331
  </port>
332
  </output>
333
  </layer>
334
+ <layer id="31" name="Constant_83327" type="Const" version="opset1">
335
+ <data element_type="i32" shape="50000" offset="1532260" size="200000" />
336
  <output>
337
+ <port id="0" precision="I32">
338
+ <dim>50000</dim>
339
  </port>
340
  </output>
341
  </layer>
342
+ <layer id="32" name="Constant_83329" type="Const" version="opset1">
343
+ <data element_type="u8" shape="136851" offset="1732260" size="136851" />
344
+ <output>
345
  <port id="0" precision="U8">
346
+ <dim>136851</dim>
347
  </port>
348
+ </output>
349
+ </layer>
350
+ <layer id="33" name="Constant_83313" type="Const" version="opset1">
351
+ <data element_type="i32" shape="1609" offset="1869111" size="6436" />
352
  <output>
353
+ <port id="0" precision="I32">
354
+ <dim>1609</dim>
355
  </port>
356
+ </output>
357
+ </layer>
358
+ <layer id="34" name="Constant_83315" type="Const" version="opset1">
359
+ <data element_type="i32" shape="1609" offset="1875547" size="6436" />
360
+ <output>
361
+ <port id="0" precision="I32">
362
+ <dim>1609</dim>
363
  </port>
364
+ </output>
365
+ </layer>
366
+ <layer id="35" name="Constant_83317" type="Const" version="opset1">
367
+ <data element_type="u8" shape="13728" offset="1881983" size="13728" />
368
+ <output>
369
+ <port id="0" precision="U8">
370
+ <dim>13728</dim>
371
  </port>
372
  </output>
373
  </layer>
374
+ <layer id="36" name="Constant_83330" type="Const" version="opset1">
375
+ <data element_type="i32" shape="1609" offset="1895711" size="6436" />
376
  <output>
377
  <port id="0" precision="I32">
378
  <dim>1609</dim>
379
  </port>
380
  </output>
381
  </layer>
382
+ <layer id="37" name="BPETokenizer_83331" type="BPETokenizer" version="extension">
383
  <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20000" />
384
  <input>
385
  <port id="0" precision="I32">
 
398
  <dim>-1</dim>
399
  </port>
400
  <port id="5" precision="I32">
401
+ <dim>51866</dim>
402
  </port>
403
  <port id="6" precision="I32">
404
+ <dim>51866</dim>
405
  </port>
406
  <port id="7" precision="U8">
407
+ <dim>320785</dim>
408
  </port>
409
  <port id="8" precision="I32">
410
+ <dim>50000</dim>
411
  </port>
412
  <port id="9" precision="I32">
413
+ <dim>50000</dim>
414
  </port>
415
  <port id="10" precision="U8">
416
+ <dim>169950</dim>
417
  </port>
418
  <port id="11" precision="I32">
419
+ <dim>50000</dim>
420
  </port>
421
  <port id="12" precision="I32">
422
+ <dim>50000</dim>
423
  </port>
424
  <port id="13" precision="U8">
425
+ <dim>136851</dim>
426
  </port>
427
  <port id="14" precision="I32">
428
+ <dim>1609</dim>
429
  </port>
430
  <port id="15" precision="I32">
431
+ <dim>1609</dim>
432
  </port>
433
  <port id="16" precision="U8">
434
+ <dim>13728</dim>
435
  </port>
436
  <port id="17" precision="I32">
437
  <dim>1609</dim>
 
449
  </port>
450
  </output>
451
  </layer>
452
+ <layer id="38" name="Constant_83332" type="Const" version="opset1">
453
+ <data element_type="i32" shape="" offset="1902147" size="4" />
 
 
 
 
 
 
 
 
454
  <output>
455
+ <port id="0" precision="I32" />
 
 
456
  </output>
457
  </layer>
458
+ <layer id="39" name="Constant_83334" type="Const" version="opset1">
459
+ <data element_type="u8" shape="5" offset="1902151" size="5" />
460
  <output>
461
+ <port id="0" precision="U8">
462
+ <dim>5</dim>
463
+ </port>
464
  </output>
465
  </layer>
466
+ <layer id="40" name="Constant_83336" type="Const" version="opset1">
467
+ <data element_type="u8" shape="13" offset="1902156" size="13" />
 
 
 
 
 
 
468
  <output>
469
+ <port id="0" precision="U8">
470
+ <dim>13</dim>
471
  </port>
472
  </output>
473
  </layer>
474
+ <layer id="41" name="Truncate_83337" type="Truncate" version="extension">
475
+ <data m_num_inputs="1" />
476
  <input>
477
  <port id="0" precision="I32">
478
  <dim>-1</dim>
 
480
  <port id="1" precision="I32">
481
  <dim>-1</dim>
482
  </port>
483
+ <port id="2" precision="I32">
484
+ <dim>-1</dim>
485
+ </port>
486
+ <port id="3" precision="I32" />
487
+ <port id="4" precision="U8">
488
+ <dim>5</dim>
489
+ </port>
490
+ <port id="5" precision="U8">
491
+ <dim>13</dim>
492
+ </port>
493
  </input>
494
  <output>
495
+ <port id="6" precision="I32">
496
+ <dim>-1</dim>
497
+ </port>
498
+ <port id="7" precision="I32">
499
+ <dim>-1</dim>
500
+ </port>
501
+ <port id="8" precision="I32">
502
  <dim>-1</dim>
503
  </port>
504
  </output>
505
  </layer>
506
+ <layer id="42" name="Constant_83344" type="Const" version="opset1">
507
  <data element_type="i32" shape="" offset="0" size="4" />
508
  <output>
509
  <port id="0" precision="I32" />
510
  </output>
511
  </layer>
512
+ <layer id="43" name="Constant_83345" type="Const" version="opset1">
513
  <data element_type="i32" shape="" offset="4" size="4" />
514
  <output>
515
  <port id="0" precision="I32" />
516
  </output>
517
  </layer>
518
+ <layer id="44" name="Constant_83346" type="Const" version="opset1">
519
+ <data element_type="i32" shape="1" offset="1902169" size="4" />
520
  <output>
521
  <port id="0" precision="I32">
522
  <dim>1</dim>
523
  </port>
524
  </output>
525
  </layer>
526
+ <layer id="45" name="Constant_83347" type="Const" version="opset1">
527
+ <data element_type="i32" shape="4" offset="1902173" size="16" />
528
  <output>
529
  <port id="0" precision="I32">
530
  <dim>4</dim>
531
  </port>
532
  </output>
533
  </layer>
534
+ <layer id="46" name="CombineSegments_83348" type="CombineSegments" version="extension">
535
  <input>
536
  <port id="0" precision="I32" />
537
  <port id="1" precision="I32" />
 
582
  </port>
583
  </output>
584
  </layer>
585
+ <layer id="47" name="Subtract_83349" type="Subtract" version="opset1">
586
  <data auto_broadcast="numpy" />
587
  <input>
588
  <port id="0" precision="I32">
 
598
  </port>
599
  </output>
600
  </layer>
601
+ <layer id="48" name="Constant_83350" type="Const" version="opset1">
602
  <data element_type="i32" shape="" offset="0" size="4" />
603
  <output>
604
  <port id="0" precision="I32" />
605
  </output>
606
  </layer>
607
+ <layer id="49" name="ReduceMax_83351" type="ReduceMax" version="opset1">
608
  <data keep_dims="false" />
609
  <input>
610
  <port id="0" precision="I32">
 
616
  <port id="2" precision="I32" />
617
  </output>
618
  </layer>
619
+ <layer id="50" name="Constant_83352" type="Const" version="opset1">
620
+ <data element_type="i32" shape="" offset="1902169" size="4" />
621
  <output>
622
  <port id="0" precision="I32" />
623
  </output>
624
  </layer>
625
+ <layer id="51" name="RaggedToDense_83353" type="RaggedToDense" version="extension">
626
+ <data pad_right="true" m_pad_max_length="false" />
627
  <input>
628
  <port id="0" precision="I32">
629
  <dim>-1</dim>
 
648
  </port>
649
  </output>
650
  </layer>
651
+ <layer id="52" name="Convert_83354" type="Convert" version="opset1">
652
  <data destination_type="i32" />
653
  <input>
654
  <port id="0" precision="BOOL">
 
663
  </port>
664
  </output>
665
  </layer>
666
+ <layer id="53" name="Convert_83354.0" type="Convert" version="opset1">
667
  <data destination_type="i64" />
668
  <input>
669
  <port id="0" precision="I32">
 
678
  </port>
679
  </output>
680
  </layer>
681
+ <layer id="55" name="RaggedToDense_83353.0" type="Convert" version="opset1">
682
  <data destination_type="i64" />
683
  <input>
684
  <port id="0" precision="I32">
 
693
  </port>
694
  </output>
695
  </layer>
696
+ <layer id="56" name="Result_83357" type="Result" version="opset1" output_names="input_ids">
697
  <input>
698
  <port id="0" precision="I64">
699
  <dim>-1</dim>
 
701
  </port>
702
  </input>
703
  </layer>
704
+ <layer id="54" name="Result_83359" type="Result" version="opset1" output_names="attention_mask">
705
  <input>
706
  <port id="0" precision="I64">
707
  <dim>-1</dim>
 
712
  </layers>
713
  <edges>
714
  <edge from-layer="0" from-port="0" to-layer="8" to-port="0" />
715
+ <edge from-layer="1" from-port="0" to-layer="46" to-port="0" />
716
+ <edge from-layer="2" from-port="0" to-layer="46" to-port="1" />
717
+ <edge from-layer="3" from-port="0" to-layer="46" to-port="2" />
718
+ <edge from-layer="4" from-port="0" to-layer="46" to-port="3" />
719
+ <edge from-layer="5" from-port="0" to-layer="46" to-port="4" />
720
+ <edge from-layer="6" from-port="0" to-layer="46" to-port="5" />
721
  <edge from-layer="7" from-port="0" to-layer="14" to-port="0" />
722
  <edge from-layer="8" from-port="1" to-layer="9" to-port="0" />
723
  <edge from-layer="8" from-port="3" to-layer="21" to-port="4" />
 
726
  <edge from-layer="9" from-port="1" to-layer="12" to-port="0" />
727
  <edge from-layer="10" from-port="0" to-layer="12" to-port="1" />
728
  <edge from-layer="11" from-port="0" to-layer="12" to-port="2" />
 
729
  <edge from-layer="12" from-port="3" to-layer="17" to-port="0" />
730
+ <edge from-layer="12" from-port="3" to-layer="14" to-port="1" />
731
  <edge from-layer="13" from-port="0" to-layer="14" to-port="2" />
732
  <edge from-layer="14" from-port="3" to-layer="21" to-port="0" />
733
  <edge from-layer="15" from-port="0" to-layer="19" to-port="0" />
 
736
  <edge from-layer="18" from-port="0" to-layer="19" to-port="2" />
737
  <edge from-layer="19" from-port="3" to-layer="21" to-port="1" />
738
  <edge from-layer="20" from-port="0" to-layer="21" to-port="5" />
739
+ <edge from-layer="21" from-port="6" to-layer="23" to-port="0" />
740
  <edge from-layer="21" from-port="7" to-layer="23" to-port="1" />
741
  <edge from-layer="21" from-port="8" to-layer="23" to-port="2" />
742
  <edge from-layer="21" from-port="9" to-layer="23" to-port="3" />
743
  <edge from-layer="21" from-port="10" to-layer="23" to-port="4" />
744
  <edge from-layer="21" from-port="11" to-layer="23" to-port="5" />
 
745
  <edge from-layer="22" from-port="0" to-layer="23" to-port="6" />
746
+ <edge from-layer="23" from-port="9" to-layer="37" to-port="2" />
747
+ <edge from-layer="23" from-port="11" to-layer="37" to-port="4" />
748
+ <edge from-layer="23" from-port="10" to-layer="37" to-port="3" />
749
+ <edge from-layer="23" from-port="8" to-layer="37" to-port="1" />
750
+ <edge from-layer="23" from-port="7" to-layer="37" to-port="0" />
751
+ <edge from-layer="24" from-port="0" to-layer="37" to-port="5" />
752
+ <edge from-layer="25" from-port="0" to-layer="37" to-port="6" />
753
+ <edge from-layer="26" from-port="0" to-layer="37" to-port="7" />
754
+ <edge from-layer="27" from-port="0" to-layer="37" to-port="8" />
755
+ <edge from-layer="28" from-port="0" to-layer="37" to-port="9" />
756
+ <edge from-layer="29" from-port="0" to-layer="37" to-port="10" />
757
+ <edge from-layer="30" from-port="0" to-layer="37" to-port="11" />
758
+ <edge from-layer="31" from-port="0" to-layer="37" to-port="12" />
759
+ <edge from-layer="32" from-port="0" to-layer="37" to-port="13" />
760
+ <edge from-layer="33" from-port="0" to-layer="37" to-port="14" />
761
+ <edge from-layer="34" from-port="0" to-layer="37" to-port="15" />
762
+ <edge from-layer="35" from-port="0" to-layer="37" to-port="16" />
763
+ <edge from-layer="36" from-port="0" to-layer="37" to-port="17" />
764
+ <edge from-layer="37" from-port="19" to-layer="41" to-port="1" />
765
+ <edge from-layer="37" from-port="18" to-layer="41" to-port="0" />
766
+ <edge from-layer="37" from-port="20" to-layer="41" to-port="2" />
767
+ <edge from-layer="38" from-port="0" to-layer="41" to-port="3" />
768
+ <edge from-layer="39" from-port="0" to-layer="41" to-port="4" />
769
+ <edge from-layer="40" from-port="0" to-layer="41" to-port="5" />
770
+ <edge from-layer="41" from-port="6" to-layer="46" to-port="6" />
771
+ <edge from-layer="41" from-port="7" to-layer="46" to-port="7" />
772
+ <edge from-layer="41" from-port="8" to-layer="46" to-port="8" />
773
+ <edge from-layer="42" from-port="0" to-layer="46" to-port="9" />
774
+ <edge from-layer="43" from-port="0" to-layer="46" to-port="10" />
775
+ <edge from-layer="44" from-port="0" to-layer="46" to-port="11" />
776
+ <edge from-layer="45" from-port="0" to-layer="46" to-port="12" />
777
+ <edge from-layer="46" from-port="14" to-layer="47" to-port="0" />
778
+ <edge from-layer="46" from-port="13" to-layer="47" to-port="1" />
779
+ <edge from-layer="46" from-port="13" to-layer="51" to-port="0" />
780
+ <edge from-layer="46" from-port="14" to-layer="51" to-port="1" />
781
+ <edge from-layer="46" from-port="15" to-layer="51" to-port="2" />
782
+ <edge from-layer="47" from-port="2" to-layer="49" to-port="0" />
783
+ <edge from-layer="48" from-port="0" to-layer="49" to-port="1" />
784
+ <edge from-layer="49" from-port="2" to-layer="51" to-port="3" />
785
+ <edge from-layer="50" from-port="0" to-layer="51" to-port="4" />
786
+ <edge from-layer="51" from-port="6" to-layer="52" to-port="0" />
787
+ <edge from-layer="51" from-port="5" to-layer="55" to-port="0" />
788
+ <edge from-layer="52" from-port="1" to-layer="53" to-port="0" />
789
+ <edge from-layer="53" from-port="1" to-layer="54" to-port="0" />
790
+ <edge from-layer="55" from-port="1" to-layer="56" to-port="0" />
 
 
 
 
791
  </edges>
792
  <rt_info>
793
  <add_attention_mask value="True" />
 
798
  <detokenizer_input_type value="i64" />
799
  <eos_token_id value="50257" />
800
  <handle_special_tokens_with_re />
801
+ <max_length />
802
  <number_of_inputs value="1" />
803
+ <openvino_tokenizers_version value="2025.2.0.0-565-130827ab189" />
804
+ <openvino_version value="2025.2.0-19120-87425bc78ca-releases/2025/2" />
805
+ <original_post_processor_template value="{&quot;type&quot;: &quot;TemplateProcessing&quot;, &quot;single&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|startoftranscript|>&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|notimestamps|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|endoftext|>&quot;, &quot;type_id&quot;: 0}}], &quot;pair&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|startoftranscript|>&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|notimestamps|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;B&quot;, &quot;type_id&quot;: 1}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|endoftext|>&quot;, &quot;type_id&quot;: 1}}], &quot;special_tokens&quot;: {&quot;&lt;|endoftext|>&quot;: {&quot;id&quot;: &quot;&lt;|endoftext|>&quot;, &quot;ids&quot;: [50257], &quot;tokens&quot;: [&quot;&lt;|endoftext|>&quot;]}, &quot;&lt;|notimestamps|>&quot;: {&quot;id&quot;: &quot;&lt;|notimestamps|>&quot;, &quot;ids&quot;: [50364], &quot;tokens&quot;: [&quot;&lt;|notimestamps|>&quot;]}, &quot;&lt;|startoftranscript|>&quot;: {&quot;id&quot;: &quot;&lt;|startoftranscript|>&quot;, &quot;ids&quot;: [50258], &quot;tokens&quot;: [&quot;&lt;|startoftranscript|>&quot;]}}}" />
806
  <original_tokenizer_class value="&lt;class 'transformers.models.whisper.tokenization_whisper_fast.WhisperTokenizerFast'>" />
807
  <pad_token_id value="50257" />
808
+ <processed_post_processor_template value="{&quot;single&quot;: {&quot;ids&quot;: [50258, 50364, -1, 50257], &quot;type_ids&quot;: [0, 0, 0, 0]}, &quot;pair&quot;: {&quot;ids&quot;: [50258, 50364, -1, -2, 50257], &quot;type_ids&quot;: [0, 0, 0, 1, 1]}}" />
809
  <skip_special_tokens value="True" />
810
  <streaming_detokenizer value="False" />
 
811
  <tokenizer_output_type value="i64" />
812
+ <tokenizers_version value="0.21.1" />
813
+ <transformers_version value="4.51.3" />
814
  <use_max_padding value="False" />
815
  <use_sentencepiece_backend value="False" />
816
+ <utf8_replace_mode value="replace" />
817
  <with_detokenizer value="True" />
818
  </rt_info>
819
  </net>
preprocessor_config.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "chunk_length": 30,
 
3
  "feature_extractor_type": "WhisperFeatureExtractor",
4
  "feature_size": 128,
5
  "hop_length": 160,
 
1
  {
2
  "chunk_length": 30,
3
+ "dither": 0.0,
4
  "feature_extractor_type": "WhisperFeatureExtractor",
5
  "feature_size": 128,
6
  "hop_length": 160,
tokenizer_config.json CHANGED
@@ -12987,6 +12987,7 @@
12987
  "clean_up_tokenization_spaces": true,
12988
  "eos_token": "<|endoftext|>",
12989
  "errors": "replace",
 
12990
  "model_max_length": 1000000000000000019884624838656,
12991
  "pad_token": "<|endoftext|>",
12992
  "processor_class": "WhisperProcessor",
 
12987
  "clean_up_tokenization_spaces": true,
12988
  "eos_token": "<|endoftext|>",
12989
  "errors": "replace",
12990
+ "extra_special_tokens": {},
12991
  "model_max_length": 1000000000000000019884624838656,
12992
  "pad_token": "<|endoftext|>",
12993
  "processor_class": "WhisperProcessor",