hsuwill000 committed on
Commit
4ff1b9d
·
verified ·
1 Parent(s): de4d203

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
10
+ "head_dim": 128,
11
+ "hidden_act": "silu",
12
+ "hidden_size": 4096,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 14336,
15
+ "max_position_embeddings": 131072,
16
+ "mlp_bias": false,
17
+ "model_type": "llama",
18
+ "num_attention_heads": 32,
19
+ "num_hidden_layers": 32,
20
+ "num_key_value_heads": 8,
21
+ "pretraining_tp": 1,
22
+ "rms_norm_eps": 1e-05,
23
+ "rope_scaling": {
24
+ "factor": 8.0,
25
+ "high_freq_factor": 4.0,
26
+ "low_freq_factor": 1.0,
27
+ "original_max_position_embeddings": 8192,
28
+ "rope_type": "llama3"
29
+ },
30
+ "rope_theta": 500000.0,
31
+ "tie_word_embeddings": false,
32
+ "torch_dtype": "bfloat16",
33
+ "transformers_version": "4.51.3",
34
+ "use_cache": false,
35
+ "vocab_size": 188256
36
+ }
generation_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 128000,
4
+ "do_sample": true,
5
+ "eos_token_id": [
6
+ 128001,
7
+ 128008,
8
+ 128009
9
+ ],
10
+ "temperature": 0.6,
11
+ "top_p": 0.9,
12
+ "transformers_version": "4.51.3"
13
+ }
openvino_detokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87ce11cd7ca7c039ca261232f4dc2706cbed54bac4af7ecbeb6dbc409c360970
3
+ size 2773676
openvino_detokenizer.xml ADDED
@@ -0,0 +1,271 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="detokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_96963" type="Parameter" version="opset1">
5
+ <data shape="?,?" element_type="i64" />
6
+ <output>
7
+ <port id="0" precision="I64" names="Parameter_96963">
8
+ <dim>-1</dim>
9
+ <dim>-1</dim>
10
+ </port>
11
+ </output>
12
+ </layer>
13
+ <layer id="1" name="Convert_97167" type="Convert" version="opset1">
14
+ <data destination_type="i32" />
15
+ <input>
16
+ <port id="0" precision="I64">
17
+ <dim>-1</dim>
18
+ <dim>-1</dim>
19
+ </port>
20
+ </input>
21
+ <output>
22
+ <port id="1" precision="I32">
23
+ <dim>-1</dim>
24
+ <dim>-1</dim>
25
+ </port>
26
+ </output>
27
+ </layer>
28
+ <layer id="2" name="Constant_96965" type="Const" version="opset1">
29
+ <data element_type="i32" shape="188256" offset="0" size="753024" />
30
+ <output>
31
+ <port id="0" precision="I32">
32
+ <dim>188256</dim>
33
+ </port>
34
+ </output>
35
+ </layer>
36
+ <layer id="3" name="Constant_96967" type="Const" version="opset1">
37
+ <data element_type="i32" shape="188256" offset="753024" size="753024" />
38
+ <output>
39
+ <port id="0" precision="I32">
40
+ <dim>188256</dim>
41
+ </port>
42
+ </output>
43
+ </layer>
44
+ <layer id="4" name="Constant_96969" type="Const" version="opset1">
45
+ <data element_type="u8" shape="1266551" offset="1506048" size="1266551" />
46
+ <output>
47
+ <port id="0" precision="U8">
48
+ <dim>1266551</dim>
49
+ </port>
50
+ </output>
51
+ </layer>
52
+ <layer id="5" name="Slice_96974" type="Const" version="opset1">
53
+ <data element_type="i32" shape="256" offset="2772599" size="1024" />
54
+ <output>
55
+ <port id="0" precision="I32">
56
+ <dim>256</dim>
57
+ </port>
58
+ </output>
59
+ </layer>
60
+ <layer id="6" name="VocabDecoder_96976" type="VocabDecoder" version="extension">
61
+ <data skip_tokens="" />
62
+ <input>
63
+ <port id="0" precision="I32">
64
+ <dim>-1</dim>
65
+ <dim>-1</dim>
66
+ </port>
67
+ <port id="1" precision="I32">
68
+ <dim>188256</dim>
69
+ </port>
70
+ <port id="2" precision="I32">
71
+ <dim>188256</dim>
72
+ </port>
73
+ <port id="3" precision="U8">
74
+ <dim>1266551</dim>
75
+ </port>
76
+ <port id="4" precision="I32">
77
+ <dim>256</dim>
78
+ </port>
79
+ </input>
80
+ <output>
81
+ <port id="5" precision="I32">
82
+ <dim>-1</dim>
83
+ </port>
84
+ <port id="6" precision="I32">
85
+ <dim>-1</dim>
86
+ </port>
87
+ <port id="7" precision="I32">
88
+ <dim>-1</dim>
89
+ </port>
90
+ <port id="8" precision="I32">
91
+ <dim>-1</dim>
92
+ </port>
93
+ <port id="9" precision="U8">
94
+ <dim>-1</dim>
95
+ </port>
96
+ </output>
97
+ </layer>
98
+ <layer id="7" name="FuzeRagged_96977" type="FuzeRagged" version="extension">
99
+ <input>
100
+ <port id="0" precision="I32">
101
+ <dim>-1</dim>
102
+ </port>
103
+ <port id="1" precision="I32">
104
+ <dim>-1</dim>
105
+ </port>
106
+ <port id="2" precision="I32">
107
+ <dim>-1</dim>
108
+ </port>
109
+ <port id="3" precision="I32">
110
+ <dim>-1</dim>
111
+ </port>
112
+ </input>
113
+ <output>
114
+ <port id="4" precision="I32">
115
+ <dim>-1</dim>
116
+ </port>
117
+ <port id="5" precision="I32">
118
+ <dim>-1</dim>
119
+ </port>
120
+ </output>
121
+ </layer>
122
+ <layer id="8" name="UTF8Validate_96978" type="UTF8Validate" version="extension">
123
+ <data replace_mode="true" />
124
+ <input>
125
+ <port id="0" precision="I32">
126
+ <dim>-1</dim>
127
+ </port>
128
+ <port id="1" precision="I32">
129
+ <dim>-1</dim>
130
+ </port>
131
+ <port id="2" precision="U8">
132
+ <dim>-1</dim>
133
+ </port>
134
+ </input>
135
+ <output>
136
+ <port id="3" precision="I32">
137
+ <dim>-1</dim>
138
+ </port>
139
+ <port id="4" precision="I32">
140
+ <dim>-1</dim>
141
+ </port>
142
+ <port id="5" precision="U8">
143
+ <dim>-1</dim>
144
+ </port>
145
+ </output>
146
+ </layer>
147
+ <layer id="9" name="Constant_96980" type="Const" version="opset1">
148
+ <data element_type="u8" shape="51" offset="2773623" size="51" />
149
+ <output>
150
+ <port id="0" precision="U8">
151
+ <dim>51</dim>
152
+ </port>
153
+ </output>
154
+ </layer>
155
+ <layer id="10" name="Constant_96982" type="Const" version="opset1">
156
+ <data element_type="u8" shape="2" offset="2773674" size="2" />
157
+ <output>
158
+ <port id="0" precision="U8">
159
+ <dim>2</dim>
160
+ </port>
161
+ </output>
162
+ </layer>
163
+ <layer id="11" name="RegexNormalization_96983" type="RegexNormalization" version="extension">
164
+ <data global_replace="true" />
165
+ <input>
166
+ <port id="0" precision="I32">
167
+ <dim>-1</dim>
168
+ </port>
169
+ <port id="1" precision="I32">
170
+ <dim>-1</dim>
171
+ </port>
172
+ <port id="2" precision="U8">
173
+ <dim>-1</dim>
174
+ </port>
175
+ <port id="3" precision="U8">
176
+ <dim>51</dim>
177
+ </port>
178
+ <port id="4" precision="U8">
179
+ <dim>2</dim>
180
+ </port>
181
+ </input>
182
+ <output>
183
+ <port id="5" precision="I32">
184
+ <dim>-1</dim>
185
+ </port>
186
+ <port id="6" precision="I32">
187
+ <dim>-1</dim>
188
+ </port>
189
+ <port id="7" precision="U8">
190
+ <dim>-1</dim>
191
+ </port>
192
+ </output>
193
+ </layer>
194
+ <layer id="12" name="StringTensorPack_96984" type="StringTensorPack" version="opset15">
195
+ <input>
196
+ <port id="0" precision="I32">
197
+ <dim>-1</dim>
198
+ </port>
199
+ <port id="1" precision="I32">
200
+ <dim>-1</dim>
201
+ </port>
202
+ <port id="2" precision="U8">
203
+ <dim>-1</dim>
204
+ </port>
205
+ </input>
206
+ <output>
207
+ <port id="3" precision="STRING" names="Result_96985,string_output">
208
+ <dim>-1</dim>
209
+ </port>
210
+ </output>
211
+ </layer>
212
+ <layer id="13" name="Result_96985" type="Result" version="opset1" output_names="Result_96985,string_output">
213
+ <input>
214
+ <port id="0" precision="STRING">
215
+ <dim>-1</dim>
216
+ </port>
217
+ </input>
218
+ </layer>
219
+ </layers>
220
+ <edges>
221
+ <edge from-layer="0" from-port="0" to-layer="1" to-port="0" />
222
+ <edge from-layer="1" from-port="1" to-layer="6" to-port="0" />
223
+ <edge from-layer="2" from-port="0" to-layer="6" to-port="1" />
224
+ <edge from-layer="3" from-port="0" to-layer="6" to-port="2" />
225
+ <edge from-layer="4" from-port="0" to-layer="6" to-port="3" />
226
+ <edge from-layer="5" from-port="0" to-layer="6" to-port="4" />
227
+ <edge from-layer="6" from-port="5" to-layer="7" to-port="0" />
228
+ <edge from-layer="6" from-port="6" to-layer="7" to-port="1" />
229
+ <edge from-layer="6" from-port="7" to-layer="7" to-port="2" />
230
+ <edge from-layer="6" from-port="8" to-layer="7" to-port="3" />
231
+ <edge from-layer="6" from-port="9" to-layer="8" to-port="2" />
232
+ <edge from-layer="7" from-port="5" to-layer="8" to-port="1" />
233
+ <edge from-layer="7" from-port="4" to-layer="8" to-port="0" />
234
+ <edge from-layer="8" from-port="3" to-layer="11" to-port="0" />
235
+ <edge from-layer="8" from-port="4" to-layer="11" to-port="1" />
236
+ <edge from-layer="8" from-port="5" to-layer="11" to-port="2" />
237
+ <edge from-layer="9" from-port="0" to-layer="11" to-port="3" />
238
+ <edge from-layer="10" from-port="0" to-layer="11" to-port="4" />
239
+ <edge from-layer="11" from-port="5" to-layer="12" to-port="0" />
240
+ <edge from-layer="11" from-port="6" to-layer="12" to-port="1" />
241
+ <edge from-layer="11" from-port="7" to-layer="12" to-port="2" />
242
+ <edge from-layer="12" from-port="3" to-layer="13" to-port="0" />
243
+ </edges>
244
+ <rt_info>
245
+ <add_attention_mask value="True" />
246
+ <add_prefix_space />
247
+ <add_special_tokens value="True" />
248
+ <bos_token_id value="128000" />
249
+ <chat_template value="{{- bos_token }}&#10;{%- if custom_tools is defined %}&#10; {%- set tools = custom_tools %}&#10;{%- endif %}&#10;{%- if not tools_in_user_message is defined %}&#10; {%- set tools_in_user_message = true %}&#10;{%- endif %}&#10;{%- if not date_string is defined %}&#10; {%- set date_string = &quot;26 Jul 2024&quot; %}&#10;{%- endif %}&#10;{%- if not tools is defined %}&#10; {%- set tools = none %}&#10;{%- endif %}&#10;&#10;{#- This block extracts the system message, so we can slot it into the right place. #}&#10;{%- if messages[0]['role'] == 'system' %}&#10; {%- set system_message = &quot;你是一個來自台灣的AI助理,你的名字是 TAIDE,樂於以台灣人的立場幫助使用者,會用繁體中文回答問題。\n&quot; + messages[0]['content']|trim %}&#10; {%- set messages = messages[1:] %}&#10;{%- else %}&#10; {%- set system_message = &quot;你是一個來自台灣的AI助理,你的名字是 TAIDE,樂於以台灣人的立場幫助使用者,會用繁體中文回答問題。&quot; %}&#10;{%- endif %}&#10;&#10;{#- System message + builtin tools #}&#10;{{- &quot;&lt;|start_header_id|>system&lt;|end_header_id|>\n\n&quot; }}&#10;{%- if builtin_tools is defined or tools is not none %}&#10; {{- &quot;Environment: ipython\n&quot; }}&#10;{%- endif %}&#10;{%- if builtin_tools is defined %}&#10; {{- &quot;Tools: &quot; + builtin_tools | reject('equalto', 'code_interpreter') | join(&quot;, &quot;) + &quot;\n\n&quot;}}&#10;{%- endif %}&#10;{{- &quot;Cutting Knowledge Date: December 2023\n&quot; }}&#10;{{- &quot;Today Date: &quot; + date_string + &quot;\n\n&quot; }}&#10;{%- if tools is not none and not tools_in_user_message %}&#10; {{- &quot;You have access to the following functions. To call a function, please respond with JSON for a function call.&quot; }}&#10; {{- 'Respond in the format {&quot;name&quot;: function name, &quot;parameters&quot;: dictionary of argument name and its value}.' 
}}&#10; {{- &quot;Do not use variables.\n\n&quot; }}&#10; {%- for t in tools %}&#10; {{- t | tojson(indent=4) }}&#10; {{- &quot;\n\n&quot; }}&#10; {%- endfor %}&#10;{%- endif %}&#10;{{- system_message }}&#10;{{- &quot;&lt;|eot_id|>&quot; }}&#10;&#10;{#- Custom tools are passed in a user message with some extra guidance #}&#10;{%- if tools_in_user_message and not tools is none %}&#10; {#- Extract the first user message so we can plug it in here #}&#10; {%- if messages | length != 0 %}&#10; {%- set first_user_message = messages[0]['content']|trim %}&#10; {%- set messages = messages[1:] %}&#10; {%- else %}&#10; {{- raise_exception(&quot;Cannot put tools in the first user message when there's no first user message!&quot;) }}&#10;{%- endif %}&#10; {{- '&lt;|start_header_id|>user&lt;|end_header_id|>\n\n' -}}&#10; {{- &quot;Given the following functions, please respond with a JSON for a function call &quot; }}&#10; {{- &quot;with its proper arguments that best answers the given prompt.\n\n&quot; }}&#10; {{- 'Respond in the format {&quot;name&quot;: function name, &quot;parameters&quot;: dictionary of argument name and its value}.' 
}}&#10; {{- &quot;Do not use variables.\n\n&quot; }}&#10; {%- for t in tools %}&#10; {{- t | tojson(indent=4) }}&#10; {{- &quot;\n\n&quot; }}&#10; {%- endfor %}&#10; {{- first_user_message + &quot;&lt;|eot_id|>&quot;}}&#10;{%- endif %}&#10;&#10;{%- for message in messages %}&#10; {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}&#10; {{- '&lt;|start_header_id|>' + message['role'] + '&lt;|end_header_id|>\n\n'+ message['content'] | trim + '&lt;|eot_id|>' }}&#10; {%- elif 'tool_calls' in message %}&#10; {%- if not message.tool_calls|length == 1 %}&#10; {{- raise_exception(&quot;This model only supports single tool-calls at once!&quot;) }}&#10; {%- endif %}&#10; {%- set tool_call = message.tool_calls[0].function %}&#10; {%- if builtin_tools is defined and tool_call.name in builtin_tools %}&#10; {{- '&lt;|start_header_id|>assistant&lt;|end_header_id|>\n\n' -}}&#10; {{- &quot;&lt;|python_tag|>&quot; + tool_call.name + &quot;.call(&quot; }}&#10; {%- for arg_name, arg_val in tool_call.arguments | items %}&#10; {{- arg_name + '=&quot;' + arg_val + '&quot;' }}&#10; {%- if not loop.last %}&#10; {{- &quot;, &quot; }}&#10; {%- endif %}&#10; {%- endfor %}&#10; {{- &quot;)&quot; }}&#10; {%- else %}&#10; {{- '&lt;|start_header_id|>assistant&lt;|end_header_id|>\n\n' -}}&#10; {{- '{&quot;name&quot;: &quot;' + tool_call.name + '&quot;, ' }}&#10; {{- '&quot;parameters&quot;: ' }}&#10; {{- tool_call.arguments | tojson }}&#10; {{- &quot;}&quot; }}&#10; {%- endif %}&#10; {%- if builtin_tools is defined %}&#10; {#- This means we're in ipython mode #}&#10; {{- &quot;&lt;|eom_id|>&quot; }}&#10; {%- else %}&#10; {{- &quot;&lt;|eot_id|>&quot; }}&#10; {%- endif %}&#10; {%- elif message.role == &quot;tool&quot; or message.role == &quot;ipython&quot; %}&#10; {{- &quot;&lt;|start_header_id|>ipython&lt;|end_header_id|>\n\n&quot; }}&#10; {%- if message.content is mapping or message.content is iterable %}&#10; {{- message.content | tojson }}&#10; {%- else 
%}&#10; {{- message.content }}&#10; {%- endif %}&#10; {{- &quot;&lt;|eot_id|>&quot; }}&#10; {%- endif %}&#10;{%- endfor %}&#10;{%- if add_generation_prompt %}&#10; {{- '&lt;|start_header_id|>assistant&lt;|end_header_id|>\n\n' }}&#10;{%- endif %}&#10;" />
250
+ <clean_up_tokenization_spaces />
251
+ <detokenizer_input_type value="i64" />
252
+ <eos_token_id value="128009" />
253
+ <handle_special_tokens_with_re />
254
+ <max_length />
255
+ <number_of_inputs value="1" />
256
+ <openvino_tokenizers_version value="2025.3.0.0-573-fe3d3b964fb" />
257
+ <openvino_version value="2025.3.0-19357-ef1dae8b89d" />
258
+ <original_post_processor_template value="{&quot;type&quot;: &quot;Sequence&quot;, &quot;processors&quot;: [{&quot;type&quot;: &quot;ByteLevel&quot;, &quot;add_prefix_space&quot;: true, &quot;trim_offsets&quot;: false, &quot;use_regex&quot;: true}, {&quot;type&quot;: &quot;TemplateProcessing&quot;, &quot;single&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}], &quot;pair&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;type_id&quot;: 1}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;B&quot;, &quot;type_id&quot;: 1}}], &quot;special_tokens&quot;: {&quot;&lt;|begin_of_text|>&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;ids&quot;: [128000], &quot;tokens&quot;: [&quot;&lt;|begin_of_text|>&quot;]}}}]}" />
259
+ <original_tokenizer_class value="&lt;class 'transformers.tokenization_utils_fast.PreTrainedTokenizerFast'>" />
260
+ <processed_post_processor_template value="{&quot;single&quot;: {&quot;ids&quot;: [128000, -1], &quot;type_ids&quot;: [0, 0]}, &quot;pair&quot;: {&quot;ids&quot;: [128000, -1, 128000, -2], &quot;type_ids&quot;: [0, 0, 1, 1]}}" />
261
+ <skip_special_tokens value="True" />
262
+ <streaming_detokenizer value="False" />
263
+ <tokenizer_output_type value="i64" />
264
+ <tokenizers_version value="0.21.2" />
265
+ <transformers_version value="4.51.3" />
266
+ <use_max_padding value="False" />
267
+ <use_sentencepiece_backend value="False" />
268
+ <utf8_replace_mode value="replace" />
269
+ <with_detokenizer value="True" />
270
+ </rt_info>
271
+ </net>
openvino_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9c891ce3d27cc680ee38c8bcddbf44c039ac01ea062c990881e68f5e5f8e214
3
+ size 5170364060
openvino_model.xml ADDED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1474531c1606f63d2c4b0efc79120d37f2bacc6dd6c649ae8f2e5e30dbef9f50
3
+ size 11060896
openvino_tokenizer.xml ADDED
@@ -0,0 +1,763 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="tokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_96833" type="Parameter" version="opset1">
5
+ <data shape="?" element_type="string" />
6
+ <output>
7
+ <port id="0" precision="STRING" names="Parameter_96833">
8
+ <dim>-1</dim>
9
+ </port>
10
+ </output>
11
+ </layer>
12
+ <layer id="1" name="Constant_96947" type="Const" version="opset1">
13
+ <data element_type="i32" shape="" offset="0" size="4" />
14
+ <output>
15
+ <port id="0" precision="I32" />
16
+ </output>
17
+ </layer>
18
+ <layer id="2" name="Constant_96948" type="Const" version="opset1">
19
+ <data element_type="i32" shape="" offset="4" size="4" />
20
+ <output>
21
+ <port id="0" precision="I32" />
22
+ </output>
23
+ </layer>
24
+ <layer id="3" name="Constant_96949" type="Const" version="opset1">
25
+ <data element_type="i32" shape="1" offset="8" size="4" />
26
+ <output>
27
+ <port id="0" precision="I32">
28
+ <dim>1</dim>
29
+ </port>
30
+ </output>
31
+ </layer>
32
+ <layer id="4" name="Constant_96839" type="Const" version="opset1">
33
+ <data element_type="i64" shape="" offset="12" size="8" />
34
+ <output>
35
+ <port id="0" precision="I64" />
36
+ </output>
37
+ </layer>
38
+ <layer id="5" name="StringTensorUnpack_96834" type="StringTensorUnpack" version="opset15">
39
+ <input>
40
+ <port id="0" precision="STRING">
41
+ <dim>-1</dim>
42
+ </port>
43
+ </input>
44
+ <output>
45
+ <port id="1" precision="I32">
46
+ <dim>-1</dim>
47
+ </port>
48
+ <port id="2" precision="I32">
49
+ <dim>-1</dim>
50
+ </port>
51
+ <port id="3" precision="U8">
52
+ <dim>-1</dim>
53
+ </port>
54
+ </output>
55
+ </layer>
56
+ <layer id="6" name="ShapeOf_96835" type="ShapeOf" version="opset3">
57
+ <data output_type="i64" />
58
+ <input>
59
+ <port id="0" precision="I32">
60
+ <dim>-1</dim>
61
+ </port>
62
+ </input>
63
+ <output>
64
+ <port id="1" precision="I64">
65
+ <dim>1</dim>
66
+ </port>
67
+ </output>
68
+ </layer>
69
+ <layer id="7" name="Constant_96836" type="Const" version="opset1">
70
+ <data element_type="i64" shape="" offset="12" size="8" />
71
+ <output>
72
+ <port id="0" precision="I64" />
73
+ </output>
74
+ </layer>
75
+ <layer id="8" name="Constant_96837" type="Const" version="opset1">
76
+ <data element_type="i64" shape="" offset="12" size="8" />
77
+ <output>
78
+ <port id="0" precision="I64" />
79
+ </output>
80
+ </layer>
81
+ <layer id="9" name="Gather_96838" type="Gather" version="opset8">
82
+ <data batch_dims="0" />
83
+ <input>
84
+ <port id="0" precision="I64">
85
+ <dim>1</dim>
86
+ </port>
87
+ <port id="1" precision="I64" />
88
+ <port id="2" precision="I64" />
89
+ </input>
90
+ <output>
91
+ <port id="3" precision="I64" />
92
+ </output>
93
+ </layer>
94
+ <layer id="10" name="Constant_96840" type="Const" version="opset1">
95
+ <data element_type="i64" shape="" offset="20" size="8" />
96
+ <output>
97
+ <port id="0" precision="I64" />
98
+ </output>
99
+ </layer>
100
+ <layer id="11" name="Range_96841" type="Range" version="opset4">
101
+ <data output_type="i32" />
102
+ <input>
103
+ <port id="0" precision="I64" />
104
+ <port id="1" precision="I64" />
105
+ <port id="2" precision="I64" />
106
+ </input>
107
+ <output>
108
+ <port id="3" precision="I32">
109
+ <dim>-1</dim>
110
+ </port>
111
+ </output>
112
+ </layer>
113
+ <layer id="12" name="Constant_96842" type="Const" version="opset1">
114
+ <data element_type="i64" shape="" offset="20" size="8" />
115
+ <output>
116
+ <port id="0" precision="I64" />
117
+ </output>
118
+ </layer>
119
+ <layer id="13" name="Constant_96843" type="Const" version="opset1">
120
+ <data element_type="i64" shape="" offset="20" size="8" />
121
+ <output>
122
+ <port id="0" precision="I64" />
123
+ </output>
124
+ </layer>
125
+ <layer id="14" name="Add_96844" type="Add" version="opset1">
126
+ <data auto_broadcast="numpy" />
127
+ <input>
128
+ <port id="0" precision="I64" />
129
+ <port id="1" precision="I64" />
130
+ </input>
131
+ <output>
132
+ <port id="2" precision="I64" />
133
+ </output>
134
+ </layer>
135
+ <layer id="15" name="Constant_96845" type="Const" version="opset1">
136
+ <data element_type="i64" shape="" offset="20" size="8" />
137
+ <output>
138
+ <port id="0" precision="I64" />
139
+ </output>
140
+ </layer>
141
+ <layer id="16" name="Range_96846" type="Range" version="opset4">
142
+ <data output_type="i32" />
143
+ <input>
144
+ <port id="0" precision="I64" />
145
+ <port id="1" precision="I64" />
146
+ <port id="2" precision="I64" />
147
+ </input>
148
+ <output>
149
+ <port id="3" precision="I32">
150
+ <dim>-1</dim>
151
+ </port>
152
+ </output>
153
+ </layer>
154
+ <layer id="17" name="Constant_96910" type="Const" version="opset1">
155
+ <data element_type="u8" shape="617234" offset="28" size="617234" />
156
+ <output>
157
+ <port id="0" precision="U8">
158
+ <dim>617234</dim>
159
+ </port>
160
+ </output>
161
+ </layer>
162
+ <layer id="18" name="SpecialTokensSplit_96911" type="SpecialTokensSplit" version="extension">
163
+ <input>
164
+ <port id="0" precision="I32">
165
+ <dim>-1</dim>
166
+ </port>
167
+ <port id="1" precision="I32">
168
+ <dim>-1</dim>
169
+ </port>
170
+ <port id="2" precision="I32">
171
+ <dim>-1</dim>
172
+ </port>
173
+ <port id="3" precision="I32">
174
+ <dim>-1</dim>
175
+ </port>
176
+ <port id="4" precision="U8">
177
+ <dim>-1</dim>
178
+ </port>
179
+ <port id="5" precision="U8">
180
+ <dim>617234</dim>
181
+ </port>
182
+ </input>
183
+ <output>
184
+ <port id="6" precision="I32">
185
+ <dim>-1</dim>
186
+ </port>
187
+ <port id="7" precision="I32">
188
+ <dim>-1</dim>
189
+ </port>
190
+ <port id="8" precision="I32">
191
+ <dim>-1</dim>
192
+ </port>
193
+ <port id="9" precision="I32">
194
+ <dim>-1</dim>
195
+ </port>
196
+ <port id="10" precision="U8">
197
+ <dim>-1</dim>
198
+ </port>
199
+ <port id="11" precision="BOOL">
200
+ <dim>-1</dim>
201
+ </port>
202
+ </output>
203
+ </layer>
204
+ <layer id="19" name="Constant_96913" type="Const" version="opset1">
205
+ <data element_type="u8" shape="115" offset="617262" size="115" />
206
+ <output>
207
+ <port id="0" precision="U8">
208
+ <dim>115</dim>
209
+ </port>
210
+ </output>
211
+ </layer>
212
+ <layer id="20" name="RegexSplit_96914" type="RegexSplit" version="extension">
213
+ <data behaviour="isolate" invert="false" max_splits="-1" />
214
+ <input>
215
+ <port id="0" precision="I32">
216
+ <dim>-1</dim>
217
+ </port>
218
+ <port id="1" precision="I32">
219
+ <dim>-1</dim>
220
+ </port>
221
+ <port id="2" precision="I32">
222
+ <dim>-1</dim>
223
+ </port>
224
+ <port id="3" precision="I32">
225
+ <dim>-1</dim>
226
+ </port>
227
+ <port id="4" precision="U8">
228
+ <dim>-1</dim>
229
+ </port>
230
+ <port id="5" precision="BOOL">
231
+ <dim>-1</dim>
232
+ </port>
233
+ <port id="6" precision="U8">
234
+ <dim>115</dim>
235
+ </port>
236
+ </input>
237
+ <output>
238
+ <port id="7" precision="I32">
239
+ <dim>-1</dim>
240
+ </port>
241
+ <port id="8" precision="I32">
242
+ <dim>-1</dim>
243
+ </port>
244
+ <port id="9" precision="I32">
245
+ <dim>-1</dim>
246
+ </port>
247
+ <port id="10" precision="I32">
248
+ <dim>-1</dim>
249
+ </port>
250
+ <port id="11" precision="U8">
251
+ <dim>-1</dim>
252
+ </port>
253
+ <port id="12" precision="BOOL">
254
+ <dim>-1</dim>
255
+ </port>
256
+ </output>
257
+ </layer>
258
+ <layer id="21" name="Constant_96916" type="Const" version="opset1">
259
+ <data element_type="i32" shape="188256" offset="617377" size="753024" />
260
+ <output>
261
+ <port id="0" precision="I32">
262
+ <dim>188256</dim>
263
+ </port>
264
+ </output>
265
+ </layer>
266
+ <layer id="22" name="Constant_96918" type="Const" version="opset1">
267
+ <data element_type="i32" shape="188256" offset="1370401" size="753024" />
268
+ <output>
269
+ <port id="0" precision="I32">
270
+ <dim>188256</dim>
271
+ </port>
272
+ </output>
273
+ </layer>
274
+ <layer id="23" name="Constant_96920" type="Const" version="opset1">
275
+ <data element_type="u8" shape="1266551" offset="2123425" size="1266551" />
276
+ <output>
277
+ <port id="0" precision="U8">
278
+ <dim>1266551</dim>
279
+ </port>
280
+ </output>
281
+ </layer>
282
+ <layer id="24" name="Constant_96928" type="Const" version="opset1">
283
+ <data element_type="i32" shape="280147" offset="3389976" size="1120588" />
284
+ <output>
285
+ <port id="0" precision="I32">
286
+ <dim>280147</dim>
287
+ </port>
288
+ </output>
289
+ </layer>
290
+ <layer id="25" name="Constant_96930" type="Const" version="opset1">
291
+ <data element_type="i32" shape="280147" offset="4510564" size="1120588" />
292
+ <output>
293
+ <port id="0" precision="I32">
294
+ <dim>280147</dim>
295
+ </port>
296
+ </output>
297
+ </layer>
298
+ <layer id="26" name="Constant_96932" type="Const" version="opset1">
299
+ <data element_type="u8" shape="993515" offset="5631152" size="993515" />
300
+ <output>
301
+ <port id="0" precision="U8">
302
+ <dim>993515</dim>
303
+ </port>
304
+ </output>
305
+ </layer>
306
+ <layer id="27" name="Constant_96934" type="Const" version="opset1">
307
+ <data element_type="i32" shape="280147" offset="6624667" size="1120588" />
308
+ <output>
309
+ <port id="0" precision="I32">
310
+ <dim>280147</dim>
311
+ </port>
312
+ </output>
313
+ </layer>
314
+ <layer id="28" name="Constant_96936" type="Const" version="opset1">
315
+ <data element_type="i32" shape="280147" offset="7745255" size="1120588" />
316
+ <output>
317
+ <port id="0" precision="I32">
318
+ <dim>280147</dim>
319
+ </port>
320
+ </output>
321
+ </layer>
322
+ <layer id="29" name="Constant_96938" type="Const" version="opset1">
323
+ <data element_type="u8" shape="1036718" offset="8865843" size="1036718" />
324
+ <output>
325
+ <port id="0" precision="U8">
326
+ <dim>1036718</dim>
327
+ </port>
328
+ </output>
329
+ </layer>
330
+ <layer id="30" name="Constant_96922" type="Const" version="opset1">
331
+ <data element_type="i32" shape="60256" offset="9902561" size="241024" />
332
+ <output>
333
+ <port id="0" precision="I32">
334
+ <dim>60256</dim>
335
+ </port>
336
+ </output>
337
+ </layer>
338
+ <layer id="31" name="Constant_96924" type="Const" version="opset1">
339
+ <data element_type="i32" shape="60256" offset="10143585" size="241024" />
340
+ <output>
341
+ <port id="0" precision="I32">
342
+ <dim>60256</dim>
343
+ </port>
344
+ </output>
345
+ </layer>
346
+ <layer id="32" name="Constant_96926" type="Const" version="opset1">
347
+ <data element_type="u8" shape="435242" offset="10384609" size="435242" />
348
+ <output>
349
+ <port id="0" precision="U8">
350
+ <dim>435242</dim>
351
+ </port>
352
+ </output>
353
+ </layer>
354
+ <layer id="33" name="Constant_96939" type="Const" version="opset1">
355
+ <data element_type="i32" shape="60256" offset="10819851" size="241024" />
356
+ <output>
357
+ <port id="0" precision="I32">
358
+ <dim>60256</dim>
359
+ </port>
360
+ </output>
361
+ </layer>
362
+ <layer id="34" name="BPETokenizer_96940" type="BPETokenizer" version="extension">
363
+ <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="25600" />
364
+ <input>
365
+ <port id="0" precision="I32">
366
+ <dim>-1</dim>
367
+ </port>
368
+ <port id="1" precision="I32">
369
+ <dim>-1</dim>
370
+ </port>
371
+ <port id="2" precision="I32">
372
+ <dim>-1</dim>
373
+ </port>
374
+ <port id="3" precision="I32">
375
+ <dim>-1</dim>
376
+ </port>
377
+ <port id="4" precision="U8">
378
+ <dim>-1</dim>
379
+ </port>
380
+ <port id="5" precision="I32">
381
+ <dim>188256</dim>
382
+ </port>
383
+ <port id="6" precision="I32">
384
+ <dim>188256</dim>
385
+ </port>
386
+ <port id="7" precision="U8">
387
+ <dim>1266551</dim>
388
+ </port>
389
+ <port id="8" precision="I32">
390
+ <dim>280147</dim>
391
+ </port>
392
+ <port id="9" precision="I32">
393
+ <dim>280147</dim>
394
+ </port>
395
+ <port id="10" precision="U8">
396
+ <dim>993515</dim>
397
+ </port>
398
+ <port id="11" precision="I32">
399
+ <dim>280147</dim>
400
+ </port>
401
+ <port id="12" precision="I32">
402
+ <dim>280147</dim>
403
+ </port>
404
+ <port id="13" precision="U8">
405
+ <dim>1036718</dim>
406
+ </port>
407
+ <port id="14" precision="I32">
408
+ <dim>60256</dim>
409
+ </port>
410
+ <port id="15" precision="I32">
411
+ <dim>60256</dim>
412
+ </port>
413
+ <port id="16" precision="U8">
414
+ <dim>435242</dim>
415
+ </port>
416
+ <port id="17" precision="I32">
417
+ <dim>60256</dim>
418
+ </port>
419
+ </input>
420
+ <output>
421
+ <port id="18" precision="I32">
422
+ <dim>-1</dim>
423
+ </port>
424
+ <port id="19" precision="I32">
425
+ <dim>-1</dim>
426
+ </port>
427
+ <port id="20" precision="I32">
428
+ <dim>-1</dim>
429
+ </port>
430
+ </output>
431
+ </layer>
432
+ <layer id="35" name="Constant_96941" type="Const" version="opset1">
433
+ <data element_type="i32" shape="" offset="11060875" size="4" />
434
+ <output>
435
+ <port id="0" precision="I32" />
436
+ </output>
437
+ </layer>
438
+ <layer id="36" name="Constant_96943" type="Const" version="opset1">
439
+ <data element_type="u8" shape="4" offset="11060879" size="4" />
440
+ <output>
441
+ <port id="0" precision="U8">
442
+ <dim>4</dim>
443
+ </port>
444
+ </output>
445
+ </layer>
446
+ <layer id="37" name="Constant_96945" type="Const" version="opset1">
447
+ <data element_type="u8" shape="13" offset="11060883" size="13" />
448
+ <output>
449
+ <port id="0" precision="U8">
450
+ <dim>13</dim>
451
+ </port>
452
+ </output>
453
+ </layer>
454
+ <layer id="38" name="Truncate_96946" type="Truncate" version="extension">
455
+ <data m_num_inputs="1" />
456
+ <input>
457
+ <port id="0" precision="I32">
458
+ <dim>-1</dim>
459
+ </port>
460
+ <port id="1" precision="I32">
461
+ <dim>-1</dim>
462
+ </port>
463
+ <port id="2" precision="I32">
464
+ <dim>-1</dim>
465
+ </port>
466
+ <port id="3" precision="I32" />
467
+ <port id="4" precision="U8">
468
+ <dim>4</dim>
469
+ </port>
470
+ <port id="5" precision="U8">
471
+ <dim>13</dim>
472
+ </port>
473
+ </input>
474
+ <output>
475
+ <port id="6" precision="I32">
476
+ <dim>-1</dim>
477
+ </port>
478
+ <port id="7" precision="I32">
479
+ <dim>-1</dim>
480
+ </port>
481
+ <port id="8" precision="I32">
482
+ <dim>-1</dim>
483
+ </port>
484
+ </output>
485
+ </layer>
486
+ <layer id="39" name="Constant_96950" type="Const" version="opset1">
487
+ <data element_type="i32" shape="2" offset="12" size="8" />
488
+ <output>
489
+ <port id="0" precision="I32">
490
+ <dim>2</dim>
491
+ </port>
492
+ </output>
493
+ </layer>
494
+ <layer id="40" name="CombineSegments_96951" type="CombineSegments" version="extension">
495
+ <input>
496
+ <port id="0" precision="I32" />
497
+ <port id="1" precision="I32" />
498
+ <port id="2" precision="I32">
499
+ <dim>1</dim>
500
+ </port>
501
+ <port id="3" precision="I32">
502
+ <dim>-1</dim>
503
+ </port>
504
+ <port id="4" precision="I32">
505
+ <dim>-1</dim>
506
+ </port>
507
+ <port id="5" precision="I32">
508
+ <dim>-1</dim>
509
+ </port>
510
+ <port id="6" precision="I32">
511
+ <dim>2</dim>
512
+ </port>
513
+ </input>
514
+ <output>
515
+ <port id="7" precision="I32">
516
+ <dim>-1</dim>
517
+ </port>
518
+ <port id="8" precision="I32">
519
+ <dim>-1</dim>
520
+ </port>
521
+ <port id="9" precision="I32">
522
+ <dim>-1</dim>
523
+ </port>
524
+ <port id="10" precision="I32">
525
+ <dim>-1</dim>
526
+ </port>
527
+ <port id="11" precision="I32">
528
+ <dim>-1</dim>
529
+ </port>
530
+ <port id="12" precision="I32">
531
+ <dim>-1</dim>
532
+ </port>
533
+ </output>
534
+ </layer>
535
+ <layer id="41" name="Subtract_96952" type="Subtract" version="opset1">
536
+ <data auto_broadcast="numpy" />
537
+ <input>
538
+ <port id="0" precision="I32">
539
+ <dim>-1</dim>
540
+ </port>
541
+ <port id="1" precision="I32">
542
+ <dim>-1</dim>
543
+ </port>
544
+ </input>
545
+ <output>
546
+ <port id="2" precision="I32">
547
+ <dim>-1</dim>
548
+ </port>
549
+ </output>
550
+ </layer>
551
+ <layer id="42" name="Constant_96953" type="Const" version="opset1">
552
+ <data element_type="i32" shape="" offset="0" size="4" />
553
+ <output>
554
+ <port id="0" precision="I32" />
555
+ </output>
556
+ </layer>
557
+ <layer id="43" name="ReduceMax_96954" type="ReduceMax" version="opset1">
558
+ <data keep_dims="false" />
559
+ <input>
560
+ <port id="0" precision="I32">
561
+ <dim>-1</dim>
562
+ </port>
563
+ <port id="1" precision="I32" />
564
+ </input>
565
+ <output>
566
+ <port id="2" precision="I32" />
567
+ </output>
568
+ </layer>
569
+ <layer id="44" name="Constant_96955" type="Const" version="opset1">
570
+ <data element_type="i32" shape="" offset="0" size="4" />
571
+ <output>
572
+ <port id="0" precision="I32" />
573
+ </output>
574
+ </layer>
575
+ <layer id="45" name="RaggedToDense_96956" type="RaggedToDense" version="extension">
576
+ <data pad_right="false" m_pad_max_length="false" />
577
+ <input>
578
+ <port id="0" precision="I32">
579
+ <dim>-1</dim>
580
+ </port>
581
+ <port id="1" precision="I32">
582
+ <dim>-1</dim>
583
+ </port>
584
+ <port id="2" precision="I32">
585
+ <dim>-1</dim>
586
+ </port>
587
+ <port id="3" precision="I32" />
588
+ <port id="4" precision="I32" />
589
+ </input>
590
+ <output>
591
+ <port id="5" precision="I32">
592
+ <dim>-1</dim>
593
+ <dim>-1</dim>
594
+ </port>
595
+ <port id="6" precision="BOOL">
596
+ <dim>-1</dim>
597
+ <dim>-1</dim>
598
+ </port>
599
+ </output>
600
+ </layer>
601
+ <layer id="46" name="Convert_96957" type="Convert" version="opset1">
602
+ <data destination_type="i32" />
603
+ <input>
604
+ <port id="0" precision="BOOL">
605
+ <dim>-1</dim>
606
+ <dim>-1</dim>
607
+ </port>
608
+ </input>
609
+ <output>
610
+ <port id="1" precision="I32">
611
+ <dim>-1</dim>
612
+ <dim>-1</dim>
613
+ </port>
614
+ </output>
615
+ </layer>
616
+ <layer id="47" name="Convert_96957.0" type="Convert" version="opset1">
617
+ <data destination_type="i64" />
618
+ <input>
619
+ <port id="0" precision="I32">
620
+ <dim>-1</dim>
621
+ <dim>-1</dim>
622
+ </port>
623
+ </input>
624
+ <output>
625
+ <port id="1" precision="I64" names="attention_mask">
626
+ <dim>-1</dim>
627
+ <dim>-1</dim>
628
+ </port>
629
+ </output>
630
+ </layer>
631
+ <layer id="49" name="RaggedToDense_96956.0" type="Convert" version="opset1">
632
+ <data destination_type="i64" />
633
+ <input>
634
+ <port id="0" precision="I32">
635
+ <dim>-1</dim>
636
+ <dim>-1</dim>
637
+ </port>
638
+ </input>
639
+ <output>
640
+ <port id="1" precision="I64" names="input_ids">
641
+ <dim>-1</dim>
642
+ <dim>-1</dim>
643
+ </port>
644
+ </output>
645
+ </layer>
646
+ <layer id="50" name="Result_96960" type="Result" version="opset1" output_names="input_ids">
647
+ <input>
648
+ <port id="0" precision="I64">
649
+ <dim>-1</dim>
650
+ <dim>-1</dim>
651
+ </port>
652
+ </input>
653
+ </layer>
654
+ <layer id="48" name="Result_96962" type="Result" version="opset1" output_names="attention_mask">
655
+ <input>
656
+ <port id="0" precision="I64">
657
+ <dim>-1</dim>
658
+ <dim>-1</dim>
659
+ </port>
660
+ </input>
661
+ </layer>
662
+ </layers>
663
+ <edges>
664
+ <edge from-layer="0" from-port="0" to-layer="5" to-port="0" />
665
+ <edge from-layer="1" from-port="0" to-layer="40" to-port="0" />
666
+ <edge from-layer="2" from-port="0" to-layer="40" to-port="1" />
667
+ <edge from-layer="3" from-port="0" to-layer="40" to-port="2" />
668
+ <edge from-layer="4" from-port="0" to-layer="11" to-port="0" />
669
+ <edge from-layer="5" from-port="1" to-layer="6" to-port="0" />
670
+ <edge from-layer="5" from-port="3" to-layer="18" to-port="4" />
671
+ <edge from-layer="5" from-port="2" to-layer="18" to-port="3" />
672
+ <edge from-layer="5" from-port="1" to-layer="18" to-port="2" />
673
+ <edge from-layer="6" from-port="1" to-layer="9" to-port="0" />
674
+ <edge from-layer="7" from-port="0" to-layer="9" to-port="1" />
675
+ <edge from-layer="8" from-port="0" to-layer="9" to-port="2" />
676
+ <edge from-layer="9" from-port="3" to-layer="14" to-port="0" />
677
+ <edge from-layer="9" from-port="3" to-layer="11" to-port="1" />
678
+ <edge from-layer="10" from-port="0" to-layer="11" to-port="2" />
679
+ <edge from-layer="11" from-port="3" to-layer="18" to-port="0" />
680
+ <edge from-layer="12" from-port="0" to-layer="16" to-port="0" />
681
+ <edge from-layer="13" from-port="0" to-layer="14" to-port="1" />
682
+ <edge from-layer="14" from-port="2" to-layer="16" to-port="1" />
683
+ <edge from-layer="15" from-port="0" to-layer="16" to-port="2" />
684
+ <edge from-layer="16" from-port="3" to-layer="18" to-port="1" />
685
+ <edge from-layer="17" from-port="0" to-layer="18" to-port="5" />
686
+ <edge from-layer="18" from-port="11" to-layer="20" to-port="5" />
687
+ <edge from-layer="18" from-port="10" to-layer="20" to-port="4" />
688
+ <edge from-layer="18" from-port="9" to-layer="20" to-port="3" />
689
+ <edge from-layer="18" from-port="8" to-layer="20" to-port="2" />
690
+ <edge from-layer="18" from-port="7" to-layer="20" to-port="1" />
691
+ <edge from-layer="18" from-port="6" to-layer="20" to-port="0" />
692
+ <edge from-layer="19" from-port="0" to-layer="20" to-port="6" />
693
+ <edge from-layer="20" from-port="7" to-layer="34" to-port="0" />
694
+ <edge from-layer="20" from-port="8" to-layer="34" to-port="1" />
695
+ <edge from-layer="20" from-port="9" to-layer="34" to-port="2" />
696
+ <edge from-layer="20" from-port="10" to-layer="34" to-port="3" />
697
+ <edge from-layer="20" from-port="11" to-layer="34" to-port="4" />
698
+ <edge from-layer="21" from-port="0" to-layer="34" to-port="5" />
699
+ <edge from-layer="22" from-port="0" to-layer="34" to-port="6" />
700
+ <edge from-layer="23" from-port="0" to-layer="34" to-port="7" />
701
+ <edge from-layer="24" from-port="0" to-layer="34" to-port="8" />
702
+ <edge from-layer="25" from-port="0" to-layer="34" to-port="9" />
703
+ <edge from-layer="26" from-port="0" to-layer="34" to-port="10" />
704
+ <edge from-layer="27" from-port="0" to-layer="34" to-port="11" />
705
+ <edge from-layer="28" from-port="0" to-layer="34" to-port="12" />
706
+ <edge from-layer="29" from-port="0" to-layer="34" to-port="13" />
707
+ <edge from-layer="30" from-port="0" to-layer="34" to-port="14" />
708
+ <edge from-layer="31" from-port="0" to-layer="34" to-port="15" />
709
+ <edge from-layer="32" from-port="0" to-layer="34" to-port="16" />
710
+ <edge from-layer="33" from-port="0" to-layer="34" to-port="17" />
711
+ <edge from-layer="34" from-port="18" to-layer="38" to-port="0" />
712
+ <edge from-layer="34" from-port="19" to-layer="38" to-port="1" />
713
+ <edge from-layer="34" from-port="20" to-layer="38" to-port="2" />
714
+ <edge from-layer="35" from-port="0" to-layer="38" to-port="3" />
715
+ <edge from-layer="36" from-port="0" to-layer="38" to-port="4" />
716
+ <edge from-layer="37" from-port="0" to-layer="38" to-port="5" />
717
+ <edge from-layer="38" from-port="8" to-layer="40" to-port="5" />
718
+ <edge from-layer="38" from-port="6" to-layer="40" to-port="3" />
719
+ <edge from-layer="38" from-port="7" to-layer="40" to-port="4" />
720
+ <edge from-layer="39" from-port="0" to-layer="40" to-port="6" />
721
+ <edge from-layer="40" from-port="8" to-layer="45" to-port="1" />
722
+ <edge from-layer="40" from-port="9" to-layer="45" to-port="2" />
723
+ <edge from-layer="40" from-port="7" to-layer="45" to-port="0" />
724
+ <edge from-layer="40" from-port="7" to-layer="41" to-port="1" />
725
+ <edge from-layer="40" from-port="8" to-layer="41" to-port="0" />
726
+ <edge from-layer="41" from-port="2" to-layer="43" to-port="0" />
727
+ <edge from-layer="42" from-port="0" to-layer="43" to-port="1" />
728
+ <edge from-layer="43" from-port="2" to-layer="45" to-port="3" />
729
+ <edge from-layer="44" from-port="0" to-layer="45" to-port="4" />
730
+ <edge from-layer="45" from-port="6" to-layer="46" to-port="0" />
731
+ <edge from-layer="45" from-port="5" to-layer="49" to-port="0" />
732
+ <edge from-layer="46" from-port="1" to-layer="47" to-port="0" />
733
+ <edge from-layer="47" from-port="1" to-layer="48" to-port="0" />
734
+ <edge from-layer="49" from-port="1" to-layer="50" to-port="0" />
735
+ </edges>
736
+ <rt_info>
737
+ <add_attention_mask value="True" />
738
+ <add_prefix_space />
739
+ <add_special_tokens value="True" />
740
+ <bos_token_id value="128000" />
741
+ <chat_template value="{{- bos_token }}&#10;{%- if custom_tools is defined %}&#10; {%- set tools = custom_tools %}&#10;{%- endif %}&#10;{%- if not tools_in_user_message is defined %}&#10; {%- set tools_in_user_message = true %}&#10;{%- endif %}&#10;{%- if not date_string is defined %}&#10; {%- set date_string = &quot;26 Jul 2024&quot; %}&#10;{%- endif %}&#10;{%- if not tools is defined %}&#10; {%- set tools = none %}&#10;{%- endif %}&#10;&#10;{#- This block extracts the system message, so we can slot it into the right place. #}&#10;{%- if messages[0]['role'] == 'system' %}&#10; {%- set system_message = &quot;你是一個來自台灣的AI助理,你的名字是 TAIDE,樂於以台灣人的立場幫助使用者,會用繁體中文回答問題。\n&quot; + messages[0]['content']|trim %}&#10; {%- set messages = messages[1:] %}&#10;{%- else %}&#10; {%- set system_message = &quot;你是一個來自台灣的AI助理,你的名字是 TAIDE,樂於以台灣人的立場幫助使用者,會用繁體中文回答問題。&quot; %}&#10;{%- endif %}&#10;&#10;{#- System message + builtin tools #}&#10;{{- &quot;&lt;|start_header_id|>system&lt;|end_header_id|>\n\n&quot; }}&#10;{%- if builtin_tools is defined or tools is not none %}&#10; {{- &quot;Environment: ipython\n&quot; }}&#10;{%- endif %}&#10;{%- if builtin_tools is defined %}&#10; {{- &quot;Tools: &quot; + builtin_tools | reject('equalto', 'code_interpreter') | join(&quot;, &quot;) + &quot;\n\n&quot;}}&#10;{%- endif %}&#10;{{- &quot;Cutting Knowledge Date: December 2023\n&quot; }}&#10;{{- &quot;Today Date: &quot; + date_string + &quot;\n\n&quot; }}&#10;{%- if tools is not none and not tools_in_user_message %}&#10; {{- &quot;You have access to the following functions. To call a function, please respond with JSON for a function call.&quot; }}&#10; {{- 'Respond in the format {&quot;name&quot;: function name, &quot;parameters&quot;: dictionary of argument name and its value}.' 
}}&#10; {{- &quot;Do not use variables.\n\n&quot; }}&#10; {%- for t in tools %}&#10; {{- t | tojson(indent=4) }}&#10; {{- &quot;\n\n&quot; }}&#10; {%- endfor %}&#10;{%- endif %}&#10;{{- system_message }}&#10;{{- &quot;&lt;|eot_id|>&quot; }}&#10;&#10;{#- Custom tools are passed in a user message with some extra guidance #}&#10;{%- if tools_in_user_message and not tools is none %}&#10; {#- Extract the first user message so we can plug it in here #}&#10; {%- if messages | length != 0 %}&#10; {%- set first_user_message = messages[0]['content']|trim %}&#10; {%- set messages = messages[1:] %}&#10; {%- else %}&#10; {{- raise_exception(&quot;Cannot put tools in the first user message when there's no first user message!&quot;) }}&#10;{%- endif %}&#10; {{- '&lt;|start_header_id|>user&lt;|end_header_id|>\n\n' -}}&#10; {{- &quot;Given the following functions, please respond with a JSON for a function call &quot; }}&#10; {{- &quot;with its proper arguments that best answers the given prompt.\n\n&quot; }}&#10; {{- 'Respond in the format {&quot;name&quot;: function name, &quot;parameters&quot;: dictionary of argument name and its value}.' 
}}&#10; {{- &quot;Do not use variables.\n\n&quot; }}&#10; {%- for t in tools %}&#10; {{- t | tojson(indent=4) }}&#10; {{- &quot;\n\n&quot; }}&#10; {%- endfor %}&#10; {{- first_user_message + &quot;&lt;|eot_id|>&quot;}}&#10;{%- endif %}&#10;&#10;{%- for message in messages %}&#10; {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}&#10; {{- '&lt;|start_header_id|>' + message['role'] + '&lt;|end_header_id|>\n\n'+ message['content'] | trim + '&lt;|eot_id|>' }}&#10; {%- elif 'tool_calls' in message %}&#10; {%- if not message.tool_calls|length == 1 %}&#10; {{- raise_exception(&quot;This model only supports single tool-calls at once!&quot;) }}&#10; {%- endif %}&#10; {%- set tool_call = message.tool_calls[0].function %}&#10; {%- if builtin_tools is defined and tool_call.name in builtin_tools %}&#10; {{- '&lt;|start_header_id|>assistant&lt;|end_header_id|>\n\n' -}}&#10; {{- &quot;&lt;|python_tag|>&quot; + tool_call.name + &quot;.call(&quot; }}&#10; {%- for arg_name, arg_val in tool_call.arguments | items %}&#10; {{- arg_name + '=&quot;' + arg_val + '&quot;' }}&#10; {%- if not loop.last %}&#10; {{- &quot;, &quot; }}&#10; {%- endif %}&#10; {%- endfor %}&#10; {{- &quot;)&quot; }}&#10; {%- else %}&#10; {{- '&lt;|start_header_id|>assistant&lt;|end_header_id|>\n\n' -}}&#10; {{- '{&quot;name&quot;: &quot;' + tool_call.name + '&quot;, ' }}&#10; {{- '&quot;parameters&quot;: ' }}&#10; {{- tool_call.arguments | tojson }}&#10; {{- &quot;}&quot; }}&#10; {%- endif %}&#10; {%- if builtin_tools is defined %}&#10; {#- This means we're in ipython mode #}&#10; {{- &quot;&lt;|eom_id|>&quot; }}&#10; {%- else %}&#10; {{- &quot;&lt;|eot_id|>&quot; }}&#10; {%- endif %}&#10; {%- elif message.role == &quot;tool&quot; or message.role == &quot;ipython&quot; %}&#10; {{- &quot;&lt;|start_header_id|>ipython&lt;|end_header_id|>\n\n&quot; }}&#10; {%- if message.content is mapping or message.content is iterable %}&#10; {{- message.content | tojson }}&#10; {%- else 
%}&#10; {{- message.content }}&#10; {%- endif %}&#10; {{- &quot;&lt;|eot_id|>&quot; }}&#10; {%- endif %}&#10;{%- endfor %}&#10;{%- if add_generation_prompt %}&#10; {{- '&lt;|start_header_id|>assistant&lt;|end_header_id|>\n\n' }}&#10;{%- endif %}&#10;" />
742
+ <clean_up_tokenization_spaces />
743
+ <detokenizer_input_type value="i64" />
744
+ <eos_token_id value="128009" />
745
+ <handle_special_tokens_with_re />
746
+ <max_length />
747
+ <number_of_inputs value="1" />
748
+ <openvino_tokenizers_version value="2025.3.0.0-573-fe3d3b964fb" />
749
+ <openvino_version value="2025.3.0-19357-ef1dae8b89d" />
750
+ <original_post_processor_template value="{&quot;type&quot;: &quot;Sequence&quot;, &quot;processors&quot;: [{&quot;type&quot;: &quot;ByteLevel&quot;, &quot;add_prefix_space&quot;: true, &quot;trim_offsets&quot;: false, &quot;use_regex&quot;: true}, {&quot;type&quot;: &quot;TemplateProcessing&quot;, &quot;single&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}], &quot;pair&quot;: [{&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;type_id&quot;: 0}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;A&quot;, &quot;type_id&quot;: 0}}, {&quot;SpecialToken&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;type_id&quot;: 1}}, {&quot;Sequence&quot;: {&quot;id&quot;: &quot;B&quot;, &quot;type_id&quot;: 1}}], &quot;special_tokens&quot;: {&quot;&lt;|begin_of_text|>&quot;: {&quot;id&quot;: &quot;&lt;|begin_of_text|>&quot;, &quot;ids&quot;: [128000], &quot;tokens&quot;: [&quot;&lt;|begin_of_text|>&quot;]}}}]}" />
751
+ <original_tokenizer_class value="&lt;class 'transformers.tokenization_utils_fast.PreTrainedTokenizerFast'>" />
752
+ <processed_post_processor_template value="{&quot;single&quot;: {&quot;ids&quot;: [128000, -1], &quot;type_ids&quot;: [0, 0]}, &quot;pair&quot;: {&quot;ids&quot;: [128000, -1, 128000, -2], &quot;type_ids&quot;: [0, 0, 1, 1]}}" />
753
+ <skip_special_tokens value="True" />
754
+ <streaming_detokenizer value="False" />
755
+ <tokenizer_output_type value="i64" />
756
+ <tokenizers_version value="0.21.2" />
757
+ <transformers_version value="4.51.3" />
758
+ <use_max_padding value="False" />
759
+ <use_sentencepiece_backend value="False" />
760
+ <utf8_replace_mode value="replace" />
761
+ <with_detokenizer value="True" />
762
+ </rt_info>
763
+ </net>
special_tokens_map.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin_of_text|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|eot_id|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ }
16
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28c3050d409c8efc2f75afc12eeec40d3f144a9dcbf29342d51ace4c96f8c283
3
+ size 28257705
tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:417ca5337d0cfc0955e135c6b64f52ecfa95b726b3eeb7d6a10a6c43c2ba81c6
3
+ size 10503452