Echo9Zulu commited on
Commit
2ccab38
·
verified ·
1 Parent(s): 9568375

Upload 15 files

Browse files
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "silu",
3
+ "architectures": [
4
+ "ExaoneForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_exaone.ExaoneConfig",
9
+ "AutoModelForCausalLM": "modeling_exaone.ExaoneForCausalLM",
10
+ "AutoModelForSequenceClassification": "modeling_exaone.ExaoneForSequenceClassification"
11
+ },
12
+ "bos_token_id": 1,
13
+ "embed_dropout": 0.0,
14
+ "eos_token_id": 361,
15
+ "head_dim": 128,
16
+ "hidden_size": 4096,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 14336,
19
+ "layer_norm_epsilon": 1e-05,
20
+ "max_position_embeddings": 32768,
21
+ "model_type": "exaone",
22
+ "num_attention_heads": 32,
23
+ "num_key_value_heads": 8,
24
+ "num_layers": 32,
25
+ "pad_token_id": 0,
26
+ "rope_scaling": {
27
+ "factor": 8.0,
28
+ "high_freq_factor": 4.0,
29
+ "low_freq_factor": 1.0,
30
+ "original_max_position_embeddings": 8192,
31
+ "rope_type": "llama3"
32
+ },
33
+ "rope_theta": 1000000.0,
34
+ "tie_word_embeddings": false,
35
+ "torch_dtype": "bfloat16",
36
+ "transformers_version": "4.50.2",
37
+ "use_cache": true,
38
+ "vocab_size": 102400
39
+ }
configuration_exaone.py ADDED
@@ -0,0 +1,182 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # coding=utf-8
2
+ # Copyright 2021 The LG AI Research EXAONE Lab. All rights reserved.
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ """EXAONE model configuration"""
16
+
17
+ from transformers.configuration_utils import PretrainedConfig
18
+ from transformers.utils import logging
19
+
20
+
21
+ logger = logging.get_logger(__name__)
22
+
23
+ EXAONE_PRETRAINED_CONFIG_ARCHIVE_MAP = {}
24
+
25
+
26
+ class ExaoneConfig(PretrainedConfig):
27
+ r"""
28
+ This is the configuration class to store the configuration of a [`ExaoneModel`]. It is used to
29
+ instantiate an EXAONE model according to the specified arguments, defining the model architecture. Instantiating a
30
+ configuration with the defaults will yield a similar configuration to that of the EXAONE-3.0-7.8B-Instruct [LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct](https://huggingface.co/LGAI-EXAONE/EXAONE-3.0-7.8B-Instruct)
31
+
32
+ Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model
33
+ outputs. Read the documentation from [`PretrainedConfig`] for more information.
34
+
35
+
36
+ Args:
37
+ vocab_size (`int`, *optional*, defaults to 102400):
38
+ Vocabulary size of the EXAONE model. Defines the number of different tokens that can be represented by the
39
+ `input_ids` passed when calling [`ExaoneModel`]. Vocabulary size of the model.
40
+ Defines the different tokens that can be represented by the `input_ids` passed to the forward method of
41
+ [`ExaoneModel`].
42
+ max_position_embeddings (`int`, *optional*, defaults to 2048):
43
+ The maximum sequence length that this model might ever be used with. Typically set this to something large
44
+ just in case (e.g., 512 or 1024 or 2048).
45
+ hidden_size (`int`, *optional*, defaults to 2048):
46
+ Dimensionality of the encoder layers and the pooler layer.
47
+ num_layers (`int`, *optional*, defaults to 32):
48
+ Number of hidden layers in the Transformer encoder.
49
+ num_attention_heads (`int`, *optional*, defaults to 32):
50
+ Number of attention heads for each attention layer in the Transformer decoder.
51
+ num_key_value_heads (`int`, *optional*):
52
+ This is the number of key_value heads that should be used to implement Grouped Query Attention. If
53
+ `num_key_value_heads=num_attention_heads`, the model will use Multi Head Attention (MHA), if
54
+ `num_key_value_heads=1`, the model will use Multi Query Attention (MQA); otherwise GQA is used. When
55
+ converting a multi-head checkpoint to a GQA checkpoint, each group key and value head should be constructed
56
+ by meanpooling all the original heads within that group. For more details check out [this
57
+ paper](https://arxiv.org/pdf/2305.13245.pdf). If it is not specified, will default to
58
+ `num_attention_heads`.
59
+ intermediate_size (`int`, *optional*, defaults to `hidden_size * 4`):
60
+ Dimensionality of the "intermediate" (i.e., feed-forward) layer in the Transformer encoder.
61
+ activation_function (`str` or `function`, *optional*, defaults to `"silu"`):
62
+ The non-linear activation function (function or string) in the decoder.
63
+ rope_theta (`float`, *optional*, defaults to 10000.0):
64
+ The base period of the RoPE embeddings.
65
+ rope_scaling (`Dict`, *optional*):
66
+ Dictionary containing the scaling configuration for the RoPE embeddings. NOTE: if you apply new rope type
67
+ and you expect the model to work on longer `max_position_embeddings`, we recommend you to update this value
68
+ accordingly.
69
+ Expected contents:
70
+ `rope_type` (`str`):
71
+ The sub-variant of RoPE to use. Can be one of ['default', 'linear', 'dynamic', 'yarn', 'longrope',
72
+ 'llama3'], with 'default' being the original RoPE implementation.
73
+ `factor` (`float`, *optional*):
74
+ Used with all rope types except 'default'. The scaling factor to apply to the RoPE embeddings. In
75
+ most scaling types, a `factor` of x will enable the model to handle sequences of length x *
76
+ original maximum pre-trained length.
77
+ `original_max_position_embeddings` (`int`, *optional*):
78
+ Used with 'dynamic', 'longrope' and 'llama3'. The original max position embeddings used during
79
+ pretraining.
80
+ `attention_factor` (`float`, *optional*):
81
+ Used with 'yarn' and 'longrope'. The scaling factor to be applied on the attention
82
+ computation. If unspecified, it defaults to value recommended by the implementation, using the
83
+ `factor` field to infer the suggested value.
84
+ `beta_fast` (`float`, *optional*):
85
+ Only used with 'yarn'. Parameter to set the boundary for extrapolation (only) in the linear
86
+ ramp function. If unspecified, it defaults to 32.
87
+ `beta_slow` (`float`, *optional*):
88
+ Only used with 'yarn'. Parameter to set the boundary for interpolation (only) in the linear
89
+ ramp function. If unspecified, it defaults to 1.
90
+ `short_factor` (`List[float]`, *optional*):
91
+ Only used with 'longrope'. The scaling factor to be applied to short contexts (<
92
+ `original_max_position_embeddings`). Must be a list of numbers with the same length as the hidden
93
+ size divided by the number of attention heads divided by 2
94
+ `long_factor` (`List[float]`, *optional*):
95
+ Only used with 'longrope'. The scaling factor to be applied to long contexts (>
96
+ `original_max_position_embeddings`). Must be a list of numbers with the same length as the hidden
97
+ size divided by the number of attention heads divided by 2
98
+ `low_freq_factor` (`float`, *optional*):
99
+ Only used with 'llama3'. Scaling factor applied to low frequency components of the RoPE
100
+ `high_freq_factor` (`float`, *optional*):
101
+ Only used with 'llama3'. Scaling factor applied to high frequency components of the RoPE
102
+ embed_dropout (`float`, *optional*, defaults to 0.0):
103
+ The dropout probability for all fully connected layers in the embeddings, encoder, and pooler.
104
+ attention_dropout (`float`, *optional*, defaults to 0.0):
105
+ The dropout ratio for the attention probabilities.
106
+ layer_norm_epsilon (`float`, *optional*, defaults to 1e-05):
107
+ The epsilon used by the layer normalization layers.
108
+ initializer_range (`float`, *optional*, defaults to 0.02):
109
+ The standard deviation of the truncated_normal_initializer for initializing all weight matrices.
110
+ use_cache (`bool`, *optional*, defaults to `True`):
111
+ Whether or not the model should return the last key/values attentions (not used by all models). Only
112
+ relevant if ``config.is_decoder=True``.
113
+ bos_token_id (`int`, *optional*, defaults to 0):
114
+ Beginning of stream token id.
115
+ eos_token_id (`int`, *optional*, defaults to 2):
116
+ End of stream token id.
117
+
118
+ Example:
119
+
120
+ ```python
121
+ >>> from transformers import ExaoneModel, ExaoneConfig
122
+
123
+ >>> # Initializing an EXAONE configuration
124
+ >>> configuration = ExaoneConfig()
125
+
126
+ >>> # Initializing a model from configuration
127
+ >>> model = ExaoneModel(configuration)
128
+
129
+ >>> # Accessing the model configuration
130
+ >>> configuration = model.config
131
+ ```"""
132
+
133
+ model_type = "exaone"
134
+ keys_to_ignore_at_inference = ["past_key_values"]
135
+ attribute_map = {"num_hidden_layers": "num_layers"}
136
+
137
+ def __init__(
138
+ self,
139
+ vocab_size=102400,
140
+ max_position_embeddings=2048,
141
+ hidden_size=2048,
142
+ num_layers=32,
143
+ num_attention_heads=32,
144
+ num_key_value_heads=None,
145
+ intermediate_size=None,
146
+ activation_function="silu",
147
+ rope_theta=10000.0,
148
+ rope_scaling=None,
149
+ embed_dropout=0.0,
150
+ attention_dropout=0.0,
151
+ layer_norm_epsilon=1e-5,
152
+ initializer_range=0.02,
153
+ use_cache=True,
154
+ bos_token_id=0,
155
+ eos_token_id=2,
156
+ **kwargs,
157
+ ):
158
+ self.vocab_size = vocab_size
159
+ self.max_position_embeddings = max_position_embeddings
160
+ self.hidden_size = hidden_size
161
+ self.num_layers = num_layers
162
+ self.num_attention_heads = num_attention_heads
163
+ if num_key_value_heads is None:
164
+ num_key_value_heads = num_attention_heads
165
+ self.num_key_value_heads = num_key_value_heads
166
+ if intermediate_size:
167
+ self.intermediate_size = intermediate_size
168
+ else:
169
+ self.intermediate_size = hidden_size * 4
170
+ self.activation_function = activation_function
171
+ self.embed_dropout = embed_dropout
172
+ self.attention_dropout = attention_dropout
173
+ self.layer_norm_epsilon = layer_norm_epsilon
174
+ self.initializer_range = initializer_range
175
+ self.use_cache = use_cache
176
+ self.rope_theta = rope_theta
177
+ self.rope_scaling = rope_scaling
178
+
179
+ self.bos_token_id = bos_token_id
180
+ self.eos_token_id = eos_token_id
181
+
182
+ super().__init__(bos_token_id=bos_token_id, eos_token_id=eos_token_id, **kwargs)
generation_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "do_sample": true,
5
+ "eos_token_id": 361,
6
+ "pad_token_id": 0,
7
+ "temperature": 0.6,
8
+ "top_p": 0.95,
9
+ "transformers_version": "4.50.2"
10
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
openvino_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dtype": "int4",
3
+ "input_info": null,
4
+ "optimum_version": "1.25.0.dev0",
5
+ "quantization_config": {
6
+ "all_layers": null,
7
+ "backup_precision": null,
8
+ "bits": 4,
9
+ "dataset": "auto",
10
+ "dtype": "int4",
11
+ "gptq": true,
12
+ "group_size": 128,
13
+ "ignored_scope": null,
14
+ "lora_correction": null,
15
+ "num_samples": null,
16
+ "processor": null,
17
+ "quant_method": "default",
18
+ "ratio": 1.0,
19
+ "scale_estimation": true,
20
+ "sensitivity_metric": null,
21
+ "sym": false,
22
+ "tokenizer": null,
23
+ "trust_remote_code": true
24
+ },
25
+ "save_onnx_model": false,
26
+ "transformers_version": "4.50.2"
27
+ }
openvino_detokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843fef9a3b9d1d85e37f84bdd612b20a87da6e4ffa63ce7fc9ecc1deec95bf78
3
+ size 1105351
openvino_detokenizer.xml ADDED
@@ -0,0 +1,337 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="detokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_2498536" type="Parameter" version="opset1">
5
+ <data shape="?,?" element_type="i64" />
6
+ <output>
7
+ <port id="0" precision="I64" names="Parameter_2498536">
8
+ <dim>-1</dim>
9
+ <dim>-1</dim>
10
+ </port>
11
+ </output>
12
+ </layer>
13
+ <layer id="1" name="Convert_2498557" type="Convert" version="opset1">
14
+ <data destination_type="i32" />
15
+ <input>
16
+ <port id="0" precision="I64">
17
+ <dim>-1</dim>
18
+ <dim>-1</dim>
19
+ </port>
20
+ </input>
21
+ <output>
22
+ <port id="1" precision="I32">
23
+ <dim>-1</dim>
24
+ <dim>-1</dim>
25
+ </port>
26
+ </output>
27
+ </layer>
28
+ <layer id="2" name="Constant_2498511" type="Const" version="opset1">
29
+ <data element_type="u8" shape="1103982" offset="0" size="1103982" />
30
+ <output>
31
+ <port id="0" precision="U8">
32
+ <dim>1103982</dim>
33
+ </port>
34
+ </output>
35
+ </layer>
36
+ <layer id="3" name="StringTensorUnpack_2498512" type="StringTensorUnpack" version="extension">
37
+ <data mode="begins_ends" />
38
+ <input>
39
+ <port id="0" precision="U8">
40
+ <dim>1103982</dim>
41
+ </port>
42
+ </input>
43
+ <output>
44
+ <port id="1" precision="I32">
45
+ <dim>-1</dim>
46
+ </port>
47
+ <port id="2" precision="I32">
48
+ <dim>-1</dim>
49
+ </port>
50
+ <port id="3" precision="U8">
51
+ <dim>-1</dim>
52
+ </port>
53
+ </output>
54
+ </layer>
55
+ <layer id="4" name="Constant_2498540" type="Const" version="opset1">
56
+ <data element_type="i32" shape="324" offset="1103982" size="1296" />
57
+ <output>
58
+ <port id="0" precision="I32">
59
+ <dim>324</dim>
60
+ </port>
61
+ </output>
62
+ </layer>
63
+ <layer id="5" name="Constant_2498538" type="Const" version="opset1">
64
+ <data element_type="i32" shape="1" offset="1105278" size="4" />
65
+ <output>
66
+ <port id="0" precision="I32">
67
+ <dim>1</dim>
68
+ </port>
69
+ </output>
70
+ </layer>
71
+ <layer id="6" name="Constant_2498537" type="Const" version="opset1">
72
+ <data element_type="i32" shape="1" offset="1105282" size="4" />
73
+ <output>
74
+ <port id="0" precision="I32">
75
+ <dim>1</dim>
76
+ </port>
77
+ </output>
78
+ </layer>
79
+ <layer id="7" name="Constant_2498539" type="Const" version="opset1">
80
+ <data element_type="i32" shape="1" offset="1105286" size="4" />
81
+ <output>
82
+ <port id="0" precision="I32">
83
+ <dim>1</dim>
84
+ </port>
85
+ </output>
86
+ </layer>
87
+ <layer id="8" name="Constant_2498542" type="Const" version="opset1">
88
+ <data element_type="i64" shape="1" offset="1105290" size="8" />
89
+ <output>
90
+ <port id="0" precision="I64">
91
+ <dim>1</dim>
92
+ </port>
93
+ </output>
94
+ </layer>
95
+ <layer id="9" name="Slice_2498541" type="Slice" version="opset8">
96
+ <input>
97
+ <port id="0" precision="I32">
98
+ <dim>324</dim>
99
+ </port>
100
+ <port id="1" precision="I32">
101
+ <dim>1</dim>
102
+ </port>
103
+ <port id="2" precision="I32">
104
+ <dim>1</dim>
105
+ </port>
106
+ <port id="3" precision="I32">
107
+ <dim>1</dim>
108
+ </port>
109
+ <port id="4" precision="I64">
110
+ <dim>1</dim>
111
+ </port>
112
+ </input>
113
+ <output>
114
+ <port id="5" precision="I32">
115
+ <dim>324</dim>
116
+ </port>
117
+ </output>
118
+ </layer>
119
+ <layer id="10" name="VocabDecoder_2498543" type="VocabDecoder" version="extension">
120
+ <data skip_tokens="" />
121
+ <input>
122
+ <port id="0" precision="I32">
123
+ <dim>-1</dim>
124
+ <dim>-1</dim>
125
+ </port>
126
+ <port id="1" precision="I32">
127
+ <dim>-1</dim>
128
+ </port>
129
+ <port id="2" precision="I32">
130
+ <dim>-1</dim>
131
+ </port>
132
+ <port id="3" precision="U8">
133
+ <dim>-1</dim>
134
+ </port>
135
+ <port id="4" precision="I32">
136
+ <dim>324</dim>
137
+ </port>
138
+ </input>
139
+ <output>
140
+ <port id="5" precision="I32">
141
+ <dim>-1</dim>
142
+ </port>
143
+ <port id="6" precision="I32">
144
+ <dim>-1</dim>
145
+ </port>
146
+ <port id="7" precision="I32">
147
+ <dim>-1</dim>
148
+ </port>
149
+ <port id="8" precision="I32">
150
+ <dim>-1</dim>
151
+ </port>
152
+ <port id="9" precision="U8">
153
+ <dim>-1</dim>
154
+ </port>
155
+ </output>
156
+ </layer>
157
+ <layer id="11" name="FuzeRagged_2498544" type="FuzeRagged" version="extension">
158
+ <input>
159
+ <port id="0" precision="I32">
160
+ <dim>-1</dim>
161
+ </port>
162
+ <port id="1" precision="I32">
163
+ <dim>-1</dim>
164
+ </port>
165
+ <port id="2" precision="I32">
166
+ <dim>-1</dim>
167
+ </port>
168
+ <port id="3" precision="I32">
169
+ <dim>-1</dim>
170
+ </port>
171
+ </input>
172
+ <output>
173
+ <port id="4" precision="I32">
174
+ <dim>-1</dim>
175
+ </port>
176
+ <port id="5" precision="I32">
177
+ <dim>-1</dim>
178
+ </port>
179
+ </output>
180
+ </layer>
181
+ <layer id="12" name="UTF8Validate_2498545" type="UTF8Validate" version="extension">
182
+ <data replace_mode="true" />
183
+ <input>
184
+ <port id="0" precision="I32">
185
+ <dim>-1</dim>
186
+ </port>
187
+ <port id="1" precision="I32">
188
+ <dim>-1</dim>
189
+ </port>
190
+ <port id="2" precision="U8">
191
+ <dim>-1</dim>
192
+ </port>
193
+ </input>
194
+ <output>
195
+ <port id="3" precision="I32">
196
+ <dim>-1</dim>
197
+ </port>
198
+ <port id="4" precision="I32">
199
+ <dim>-1</dim>
200
+ </port>
201
+ <port id="5" precision="U8">
202
+ <dim>-1</dim>
203
+ </port>
204
+ </output>
205
+ </layer>
206
+ <layer id="13" name="Constant_2498547" type="Const" version="opset1">
207
+ <data element_type="u8" shape="51" offset="1105298" size="51" />
208
+ <output>
209
+ <port id="0" precision="U8">
210
+ <dim>51</dim>
211
+ </port>
212
+ </output>
213
+ </layer>
214
+ <layer id="14" name="Constant_2498549" type="Const" version="opset1">
215
+ <data element_type="u8" shape="2" offset="1105349" size="2" />
216
+ <output>
217
+ <port id="0" precision="U8">
218
+ <dim>2</dim>
219
+ </port>
220
+ </output>
221
+ </layer>
222
+ <layer id="15" name="RegexNormalization_2498550" type="RegexNormalization" version="extension">
223
+ <data global_replace="true" />
224
+ <input>
225
+ <port id="0" precision="I32">
226
+ <dim>-1</dim>
227
+ </port>
228
+ <port id="1" precision="I32">
229
+ <dim>-1</dim>
230
+ </port>
231
+ <port id="2" precision="U8">
232
+ <dim>-1</dim>
233
+ </port>
234
+ <port id="3" precision="U8">
235
+ <dim>51</dim>
236
+ </port>
237
+ <port id="4" precision="U8">
238
+ <dim>2</dim>
239
+ </port>
240
+ </input>
241
+ <output>
242
+ <port id="5" precision="I32">
243
+ <dim>-1</dim>
244
+ </port>
245
+ <port id="6" precision="I32">
246
+ <dim>-1</dim>
247
+ </port>
248
+ <port id="7" precision="U8">
249
+ <dim>-1</dim>
250
+ </port>
251
+ </output>
252
+ </layer>
253
+ <layer id="16" name="StringTensorPack_2498551" type="StringTensorPack" version="extension">
254
+ <data mode="begins_ends" />
255
+ <input>
256
+ <port id="0" precision="I32">
257
+ <dim>-1</dim>
258
+ </port>
259
+ <port id="1" precision="I32">
260
+ <dim>-1</dim>
261
+ </port>
262
+ <port id="2" precision="U8">
263
+ <dim>-1</dim>
264
+ </port>
265
+ </input>
266
+ <output>
267
+ <port id="3" precision="STRING" names="string_output">
268
+ <dim>-1</dim>
269
+ </port>
270
+ </output>
271
+ </layer>
272
+ <layer id="17" name="Result_2498552" type="Result" version="opset1">
273
+ <input>
274
+ <port id="0" precision="STRING">
275
+ <dim>-1</dim>
276
+ </port>
277
+ </input>
278
+ </layer>
279
+ </layers>
280
+ <edges>
281
+ <edge from-layer="0" from-port="0" to-layer="1" to-port="0" />
282
+ <edge from-layer="1" from-port="1" to-layer="10" to-port="0" />
283
+ <edge from-layer="2" from-port="0" to-layer="3" to-port="0" />
284
+ <edge from-layer="3" from-port="1" to-layer="10" to-port="1" />
285
+ <edge from-layer="3" from-port="2" to-layer="10" to-port="2" />
286
+ <edge from-layer="3" from-port="3" to-layer="10" to-port="3" />
287
+ <edge from-layer="4" from-port="0" to-layer="9" to-port="0" />
288
+ <edge from-layer="5" from-port="0" to-layer="9" to-port="1" />
289
+ <edge from-layer="6" from-port="0" to-layer="9" to-port="2" />
290
+ <edge from-layer="7" from-port="0" to-layer="9" to-port="3" />
291
+ <edge from-layer="8" from-port="0" to-layer="9" to-port="4" />
292
+ <edge from-layer="9" from-port="5" to-layer="10" to-port="4" />
293
+ <edge from-layer="10" from-port="7" to-layer="11" to-port="2" />
294
+ <edge from-layer="10" from-port="9" to-layer="12" to-port="2" />
295
+ <edge from-layer="10" from-port="8" to-layer="11" to-port="3" />
296
+ <edge from-layer="10" from-port="6" to-layer="11" to-port="1" />
297
+ <edge from-layer="10" from-port="5" to-layer="11" to-port="0" />
298
+ <edge from-layer="11" from-port="4" to-layer="12" to-port="0" />
299
+ <edge from-layer="11" from-port="5" to-layer="12" to-port="1" />
300
+ <edge from-layer="12" from-port="3" to-layer="15" to-port="0" />
301
+ <edge from-layer="12" from-port="4" to-layer="15" to-port="1" />
302
+ <edge from-layer="12" from-port="5" to-layer="15" to-port="2" />
303
+ <edge from-layer="13" from-port="0" to-layer="15" to-port="3" />
304
+ <edge from-layer="14" from-port="0" to-layer="15" to-port="4" />
305
+ <edge from-layer="15" from-port="5" to-layer="16" to-port="0" />
306
+ <edge from-layer="15" from-port="6" to-layer="16" to-port="1" />
307
+ <edge from-layer="15" from-port="7" to-layer="16" to-port="2" />
308
+ <edge from-layer="16" from-port="3" to-layer="17" to-port="0" />
309
+ </edges>
310
+ <rt_info>
311
+ <add_attention_mask value="True" />
312
+ <add_prefix_space />
313
+ <add_special_tokens value="True" />
314
+ <bos_token_id value="1" />
315
+ <chat_template value="{% for message in messages %}{% if loop.first and message['role'] != 'system' %}{{ '[|system|][|endofturn|]&#10;' }}{% endif %}{% set content = message['content'] %}{% if '&lt;/thought>' in content %}{% set content = content.split('&lt;/thought>')[-1].lstrip('\n') %}{% endif %}{{ '[|' + message['role'] + '|]' + content }}{% if not message['role'] == 'user' %}{{ '[|endofturn|]' }}{% endif %}{% if not loop.last %}{{ '&#10;' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '&#10;[|assistant|]&lt;thought>&#10;' }}{% endif %}" />
316
+ <clean_up_tokenization_spaces />
317
+ <detokenizer_input_type value="i64" />
318
+ <eos_token_id value="361" />
319
+ <handle_special_tokens_with_re />
320
+ <number_of_inputs value="1" />
321
+ <openvino_tokenizers_version value="2025.0.0.0" />
322
+ <openvino_version value="2025.0.0" />
323
+ <original_tokenizer_class value="&lt;class 'transformers.models.gpt2.tokenization_gpt2_fast.GPT2TokenizerFast'>" />
324
+ <pad_token_id value="0" />
325
+ <sentencepiece_version value="0.2.0" />
326
+ <skip_special_tokens value="True" />
327
+ <streaming_detokenizer value="False" />
328
+ <tiktoken_version value="0.7.0" />
329
+ <tokenizer_output_type value="i64" />
330
+ <tokenizers_version value="0.21.1" />
331
+ <transformers_version value="4.50.2" />
332
+ <use_max_padding value="False" />
333
+ <use_sentencepiece_backend value="False" />
334
+ <utf8_replace_mode value="replace" />
335
+ <with_detokenizer value="True" />
336
+ </rt_info>
337
+ </net>
openvino_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35494ac62c093cfb62331d92f58060380ca6a81848b743649dce06e9e575af53
3
+ size 4466516576
openvino_model.xml ADDED
The diff for this file is too large to render. See raw diff
 
openvino_tokenizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf05f6d95cb9bae5b403af6fdbd002130b213159474761fda34cdca127d69a3c
3
+ size 2622080
openvino_tokenizer.xml ADDED
@@ -0,0 +1,798 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0"?>
2
+ <net name="tokenizer" version="11">
3
+ <layers>
4
+ <layer id="0" name="Parameter_2498426" type="Parameter" version="opset1">
5
+ <data shape="?" element_type="string" />
6
+ <output>
7
+ <port id="0" precision="STRING" names="Parameter_2498426">
8
+ <dim>-1</dim>
9
+ </port>
10
+ </output>
11
+ </layer>
12
+ <layer id="1" name="Constant_2498432" type="Const" version="opset1">
13
+ <data element_type="i64" shape="" offset="0" size="8" />
14
+ <output>
15
+ <port id="0" precision="I64" />
16
+ </output>
17
+ </layer>
18
+ <layer id="2" name="StringTensorUnpack_2498427" type="StringTensorUnpack" version="extension">
19
+ <data mode="begins_ends" />
20
+ <input>
21
+ <port id="0" precision="STRING">
22
+ <dim>-1</dim>
23
+ </port>
24
+ </input>
25
+ <output>
26
+ <port id="1" precision="I32">
27
+ <dim>-1</dim>
28
+ </port>
29
+ <port id="2" precision="I32">
30
+ <dim>-1</dim>
31
+ </port>
32
+ <port id="3" precision="U8">
33
+ <dim>-1</dim>
34
+ </port>
35
+ </output>
36
+ </layer>
37
+ <layer id="3" name="ShapeOf_2498428" type="ShapeOf" version="opset3">
38
+ <data output_type="i64" />
39
+ <input>
40
+ <port id="0" precision="I32">
41
+ <dim>-1</dim>
42
+ </port>
43
+ </input>
44
+ <output>
45
+ <port id="1" precision="I64">
46
+ <dim>1</dim>
47
+ </port>
48
+ </output>
49
+ </layer>
50
+ <layer id="4" name="Constant_2498429" type="Const" version="opset1">
51
+ <data element_type="i64" shape="" offset="0" size="8" />
52
+ <output>
53
+ <port id="0" precision="I64" />
54
+ </output>
55
+ </layer>
56
+ <layer id="5" name="Constant_2498430" type="Const" version="opset1">
57
+ <data element_type="i64" shape="" offset="0" size="8" />
58
+ <output>
59
+ <port id="0" precision="I64" />
60
+ </output>
61
+ </layer>
62
+ <layer id="6" name="Gather_2498431" type="Gather" version="opset8">
63
+ <data batch_dims="0" />
64
+ <input>
65
+ <port id="0" precision="I64">
66
+ <dim>1</dim>
67
+ </port>
68
+ <port id="1" precision="I64" />
69
+ <port id="2" precision="I64" />
70
+ </input>
71
+ <output>
72
+ <port id="3" precision="I64" />
73
+ </output>
74
+ </layer>
75
+ <layer id="7" name="Constant_2498433" type="Const" version="opset1">
76
+ <data element_type="i64" shape="" offset="8" size="8" />
77
+ <output>
78
+ <port id="0" precision="I64" />
79
+ </output>
80
+ </layer>
81
+ <layer id="8" name="Range_2498434" type="Range" version="opset4">
82
+ <data output_type="i32" />
83
+ <input>
84
+ <port id="0" precision="I64" />
85
+ <port id="1" precision="I64" />
86
+ <port id="2" precision="I64" />
87
+ </input>
88
+ <output>
89
+ <port id="3" precision="I32">
90
+ <dim>-1</dim>
91
+ </port>
92
+ </output>
93
+ </layer>
94
+ <layer id="9" name="Constant_2498435" type="Const" version="opset1">
95
+ <data element_type="i64" shape="" offset="8" size="8" />
96
+ <output>
97
+ <port id="0" precision="I64" />
98
+ </output>
99
+ </layer>
100
+ <layer id="10" name="Constant_2498436" type="Const" version="opset1">
101
+ <data element_type="i64" shape="" offset="8" size="8" />
102
+ <output>
103
+ <port id="0" precision="I64" />
104
+ </output>
105
+ </layer>
106
+ <layer id="11" name="Add_2498437" type="Add" version="opset1">
107
+ <data auto_broadcast="numpy" />
108
+ <input>
109
+ <port id="0" precision="I64" />
110
+ <port id="1" precision="I64" />
111
+ </input>
112
+ <output>
113
+ <port id="2" precision="I64" />
114
+ </output>
115
+ </layer>
116
+ <layer id="12" name="Constant_2498438" type="Const" version="opset1">
117
+ <data element_type="i64" shape="" offset="8" size="8" />
118
+ <output>
119
+ <port id="0" precision="I64" />
120
+ </output>
121
+ </layer>
122
+ <layer id="13" name="Range_2498439" type="Range" version="opset4">
123
+ <data output_type="i32" />
124
+ <input>
125
+ <port id="0" precision="I64" />
126
+ <port id="1" precision="I64" />
127
+ <port id="2" precision="I64" />
128
+ </input>
129
+ <output>
130
+ <port id="3" precision="I32">
131
+ <dim>-1</dim>
132
+ </port>
133
+ </output>
134
+ </layer>
135
+ <layer id="14" name="Constant_2498501" type="Const" version="opset1">
136
+ <data element_type="u8" shape="6709" offset="16" size="6709" />
137
+ <output>
138
+ <port id="0" precision="U8">
139
+ <dim>6709</dim>
140
+ </port>
141
+ </output>
142
+ </layer>
143
+ <layer id="15" name="SpecialTokensSplit_2498502" type="SpecialTokensSplit" version="extension">
144
+ <input>
145
+ <port id="0" precision="I32">
146
+ <dim>-1</dim>
147
+ </port>
148
+ <port id="1" precision="I32">
149
+ <dim>-1</dim>
150
+ </port>
151
+ <port id="2" precision="I32">
152
+ <dim>-1</dim>
153
+ </port>
154
+ <port id="3" precision="I32">
155
+ <dim>-1</dim>
156
+ </port>
157
+ <port id="4" precision="U8">
158
+ <dim>-1</dim>
159
+ </port>
160
+ <port id="5" precision="U8">
161
+ <dim>6709</dim>
162
+ </port>
163
+ </input>
164
+ <output>
165
+ <port id="6" precision="I32">
166
+ <dim>-1</dim>
167
+ </port>
168
+ <port id="7" precision="I32">
169
+ <dim>-1</dim>
170
+ </port>
171
+ <port id="8" precision="I32">
172
+ <dim>-1</dim>
173
+ </port>
174
+ <port id="9" precision="I32">
175
+ <dim>-1</dim>
176
+ </port>
177
+ <port id="10" precision="U8">
178
+ <dim>-1</dim>
179
+ </port>
180
+ <port id="11" precision="BOOL">
181
+ <dim>-1</dim>
182
+ </port>
183
+ </output>
184
+ </layer>
185
+ <layer id="16" name="NormalizeUnicode_2498503" type="NormalizeUnicode" version="extension">
186
+ <data normalization_form="NFKC" />
187
+ <input>
188
+ <port id="0" precision="I32">
189
+ <dim>-1</dim>
190
+ </port>
191
+ <port id="1" precision="I32">
192
+ <dim>-1</dim>
193
+ </port>
194
+ <port id="2" precision="U8">
195
+ <dim>-1</dim>
196
+ </port>
197
+ <port id="3" precision="BOOL">
198
+ <dim>-1</dim>
199
+ </port>
200
+ </input>
201
+ <output>
202
+ <port id="4" precision="I32">
203
+ <dim>-1</dim>
204
+ </port>
205
+ <port id="5" precision="I32">
206
+ <dim>-1</dim>
207
+ </port>
208
+ <port id="6" precision="U8">
209
+ <dim>-1</dim>
210
+ </port>
211
+ <port id="7" precision="BOOL">
212
+ <dim>-1</dim>
213
+ </port>
214
+ </output>
215
+ </layer>
216
+ <layer id="17" name="Constant_2498505" type="Const" version="opset1">
217
+ <data element_type="u8" shape="20" offset="6725" size="20" />
218
+ <output>
219
+ <port id="0" precision="U8">
220
+ <dim>20</dim>
221
+ </port>
222
+ </output>
223
+ </layer>
224
+ <layer id="18" name="RegexSplit_2498506" type="RegexSplit" version="extension">
225
+ <data behaviour="isolate" invert="false" max_splits="-1" />
226
+ <input>
227
+ <port id="0" precision="I32">
228
+ <dim>-1</dim>
229
+ </port>
230
+ <port id="1" precision="I32">
231
+ <dim>-1</dim>
232
+ </port>
233
+ <port id="2" precision="I32">
234
+ <dim>-1</dim>
235
+ </port>
236
+ <port id="3" precision="I32">
237
+ <dim>-1</dim>
238
+ </port>
239
+ <port id="4" precision="U8">
240
+ <dim>-1</dim>
241
+ </port>
242
+ <port id="5" precision="BOOL">
243
+ <dim>-1</dim>
244
+ </port>
245
+ <port id="6" precision="U8">
246
+ <dim>20</dim>
247
+ </port>
248
+ </input>
249
+ <output>
250
+ <port id="7" precision="I32">
251
+ <dim>-1</dim>
252
+ </port>
253
+ <port id="8" precision="I32">
254
+ <dim>-1</dim>
255
+ </port>
256
+ <port id="9" precision="I32">
257
+ <dim>-1</dim>
258
+ </port>
259
+ <port id="10" precision="I32">
260
+ <dim>-1</dim>
261
+ </port>
262
+ <port id="11" precision="U8">
263
+ <dim>-1</dim>
264
+ </port>
265
+ <port id="12" precision="BOOL">
266
+ <dim>-1</dim>
267
+ </port>
268
+ </output>
269
+ </layer>
270
+ <layer id="19" name="Constant_2498508" type="Const" version="opset1">
271
+ <data element_type="u8" shape="64" offset="6745" size="64" />
272
+ <output>
273
+ <port id="0" precision="U8">
274
+ <dim>64</dim>
275
+ </port>
276
+ </output>
277
+ </layer>
278
+ <layer id="20" name="RegexSplit_2498509" type="RegexSplit" version="extension">
279
+ <data behaviour="isolate" invert="false" max_splits="-1" />
280
+ <input>
281
+ <port id="0" precision="I32">
282
+ <dim>-1</dim>
283
+ </port>
284
+ <port id="1" precision="I32">
285
+ <dim>-1</dim>
286
+ </port>
287
+ <port id="2" precision="I32">
288
+ <dim>-1</dim>
289
+ </port>
290
+ <port id="3" precision="I32">
291
+ <dim>-1</dim>
292
+ </port>
293
+ <port id="4" precision="U8">
294
+ <dim>-1</dim>
295
+ </port>
296
+ <port id="5" precision="BOOL">
297
+ <dim>-1</dim>
298
+ </port>
299
+ <port id="6" precision="U8">
300
+ <dim>64</dim>
301
+ </port>
302
+ </input>
303
+ <output>
304
+ <port id="7" precision="I32">
305
+ <dim>-1</dim>
306
+ </port>
307
+ <port id="8" precision="I32">
308
+ <dim>-1</dim>
309
+ </port>
310
+ <port id="9" precision="I32">
311
+ <dim>-1</dim>
312
+ </port>
313
+ <port id="10" precision="I32">
314
+ <dim>-1</dim>
315
+ </port>
316
+ <port id="11" precision="U8">
317
+ <dim>-1</dim>
318
+ </port>
319
+ <port id="12" precision="BOOL">
320
+ <dim>-1</dim>
321
+ </port>
322
+ </output>
323
+ </layer>
324
+ <layer id="21" name="Constant_2498511" type="Const" version="opset1">
325
+ <data element_type="u8" shape="1103982" offset="6809" size="1103982" />
326
+ <output>
327
+ <port id="0" precision="U8">
328
+ <dim>1103982</dim>
329
+ </port>
330
+ </output>
331
+ </layer>
332
+ <layer id="22" name="StringTensorUnpack_2498512" type="StringTensorUnpack" version="extension">
333
+ <data mode="begins_ends" />
334
+ <input>
335
+ <port id="0" precision="U8">
336
+ <dim>1103982</dim>
337
+ </port>
338
+ </input>
339
+ <output>
340
+ <port id="1" precision="I32">
341
+ <dim>-1</dim>
342
+ </port>
343
+ <port id="2" precision="I32">
344
+ <dim>-1</dim>
345
+ </port>
346
+ <port id="3" precision="U8">
347
+ <dim>-1</dim>
348
+ </port>
349
+ </output>
350
+ </layer>
351
+ <layer id="23" name="Constant_2498517" type="Const" version="opset1">
352
+ <data element_type="u8" shape="784577" offset="1110791" size="784577" />
353
+ <output>
354
+ <port id="0" precision="U8">
355
+ <dim>784577</dim>
356
+ </port>
357
+ </output>
358
+ </layer>
359
+ <layer id="24" name="StringTensorUnpack_2498518" type="StringTensorUnpack" version="extension">
360
+ <data mode="begins_ends" />
361
+ <input>
362
+ <port id="0" precision="U8">
363
+ <dim>784577</dim>
364
+ </port>
365
+ </input>
366
+ <output>
367
+ <port id="1" precision="I32">
368
+ <dim>-1</dim>
369
+ </port>
370
+ <port id="2" precision="I32">
371
+ <dim>-1</dim>
372
+ </port>
373
+ <port id="3" precision="U8">
374
+ <dim>-1</dim>
375
+ </port>
376
+ </output>
377
+ </layer>
378
+ <layer id="25" name="Constant_2498520" type="Const" version="opset1">
379
+ <data element_type="u8" shape="719390" offset="1895368" size="719390" />
380
+ <output>
381
+ <port id="0" precision="U8">
382
+ <dim>719390</dim>
383
+ </port>
384
+ </output>
385
+ </layer>
386
+ <layer id="26" name="StringTensorUnpack_2498521" type="StringTensorUnpack" version="extension">
387
+ <data mode="begins_ends" />
388
+ <input>
389
+ <port id="0" precision="U8">
390
+ <dim>719390</dim>
391
+ </port>
392
+ </input>
393
+ <output>
394
+ <port id="1" precision="I32">
395
+ <dim>-1</dim>
396
+ </port>
397
+ <port id="2" precision="I32">
398
+ <dim>-1</dim>
399
+ </port>
400
+ <port id="3" precision="U8">
401
+ <dim>-1</dim>
402
+ </port>
403
+ </output>
404
+ </layer>
405
+ <layer id="27" name="Constant_2498514" type="Const" version="opset1">
406
+ <data element_type="u8" shape="5870" offset="2614758" size="5870" />
407
+ <output>
408
+ <port id="0" precision="U8">
409
+ <dim>5870</dim>
410
+ </port>
411
+ </output>
412
+ </layer>
413
+ <layer id="28" name="StringTensorUnpack_2498515" type="StringTensorUnpack" version="extension">
414
+ <data mode="begins_ends" />
415
+ <input>
416
+ <port id="0" precision="U8">
417
+ <dim>5870</dim>
418
+ </port>
419
+ </input>
420
+ <output>
421
+ <port id="1" precision="I32">
422
+ <dim>-1</dim>
423
+ </port>
424
+ <port id="2" precision="I32">
425
+ <dim>-1</dim>
426
+ </port>
427
+ <port id="3" precision="U8">
428
+ <dim>-1</dim>
429
+ </port>
430
+ </output>
431
+ </layer>
432
+ <layer id="29" name="Constant_2498522" type="Const" version="opset1">
433
+ <data element_type="i32" shape="361" offset="2620628" size="1444" />
434
+ <output>
435
+ <port id="0" precision="I32">
436
+ <dim>361</dim>
437
+ </port>
438
+ </output>
439
+ </layer>
440
+ <layer id="30" name="BPETokenizer_2498523" type="BPETokenizer" version="extension">
441
+ <data unk_token="" fuse_unk="false" suffix_indicator="" end_suffix="" byte_fallback="false" cache_capacity="20480" />
442
+ <input>
443
+ <port id="0" precision="I32">
444
+ <dim>-1</dim>
445
+ </port>
446
+ <port id="1" precision="I32">
447
+ <dim>-1</dim>
448
+ </port>
449
+ <port id="2" precision="I32">
450
+ <dim>-1</dim>
451
+ </port>
452
+ <port id="3" precision="I32">
453
+ <dim>-1</dim>
454
+ </port>
455
+ <port id="4" precision="U8">
456
+ <dim>-1</dim>
457
+ </port>
458
+ <port id="5" precision="I32">
459
+ <dim>-1</dim>
460
+ </port>
461
+ <port id="6" precision="I32">
462
+ <dim>-1</dim>
463
+ </port>
464
+ <port id="7" precision="U8">
465
+ <dim>-1</dim>
466
+ </port>
467
+ <port id="8" precision="I32">
468
+ <dim>-1</dim>
469
+ </port>
470
+ <port id="9" precision="I32">
471
+ <dim>-1</dim>
472
+ </port>
473
+ <port id="10" precision="U8">
474
+ <dim>-1</dim>
475
+ </port>
476
+ <port id="11" precision="I32">
477
+ <dim>-1</dim>
478
+ </port>
479
+ <port id="12" precision="I32">
480
+ <dim>-1</dim>
481
+ </port>
482
+ <port id="13" precision="U8">
483
+ <dim>-1</dim>
484
+ </port>
485
+ <port id="14" precision="I32">
486
+ <dim>-1</dim>
487
+ </port>
488
+ <port id="15" precision="I32">
489
+ <dim>-1</dim>
490
+ </port>
491
+ <port id="16" precision="U8">
492
+ <dim>-1</dim>
493
+ </port>
494
+ <port id="17" precision="I32">
495
+ <dim>361</dim>
496
+ </port>
497
+ </input>
498
+ <output>
499
+ <port id="18" precision="I32">
500
+ <dim>-1</dim>
501
+ </port>
502
+ <port id="19" precision="I32">
503
+ <dim>-1</dim>
504
+ </port>
505
+ <port id="20" precision="I32">
506
+ <dim>-1</dim>
507
+ </port>
508
+ </output>
509
+ </layer>
510
+ <layer id="31" name="Subtract_2498524" type="Subtract" version="opset1">
511
+ <data auto_broadcast="numpy" />
512
+ <input>
513
+ <port id="0" precision="I32">
514
+ <dim>-1</dim>
515
+ </port>
516
+ <port id="1" precision="I32">
517
+ <dim>-1</dim>
518
+ </port>
519
+ </input>
520
+ <output>
521
+ <port id="2" precision="I32">
522
+ <dim>-1</dim>
523
+ </port>
524
+ </output>
525
+ </layer>
526
+ <layer id="32" name="Constant_2498525" type="Const" version="opset1">
527
+ <data element_type="i32" shape="" offset="2622072" size="4" />
528
+ <output>
529
+ <port id="0" precision="I32" />
530
+ </output>
531
+ </layer>
532
+ <layer id="33" name="Minimum_2498526" type="Minimum" version="opset1">
533
+ <data auto_broadcast="numpy" />
534
+ <input>
535
+ <port id="0" precision="I32">
536
+ <dim>-1</dim>
537
+ </port>
538
+ <port id="1" precision="I32" />
539
+ </input>
540
+ <output>
541
+ <port id="2" precision="I32">
542
+ <dim>-1</dim>
543
+ </port>
544
+ </output>
545
+ </layer>
546
+ <layer id="34" name="Subtract_2498527" type="Subtract" version="opset1">
547
+ <data auto_broadcast="numpy" />
548
+ <input>
549
+ <port id="0" precision="I32">
550
+ <dim>-1</dim>
551
+ </port>
552
+ <port id="1" precision="I32">
553
+ <dim>-1</dim>
554
+ </port>
555
+ </input>
556
+ <output>
557
+ <port id="2" precision="I32">
558
+ <dim>-1</dim>
559
+ </port>
560
+ </output>
561
+ </layer>
562
+ <layer id="35" name="Subtract_2498528" type="Subtract" version="opset1">
563
+ <data auto_broadcast="numpy" />
564
+ <input>
565
+ <port id="0" precision="I32">
566
+ <dim>-1</dim>
567
+ </port>
568
+ <port id="1" precision="I32">
569
+ <dim>-1</dim>
570
+ </port>
571
+ </input>
572
+ <output>
573
+ <port id="2" precision="I32">
574
+ <dim>-1</dim>
575
+ </port>
576
+ </output>
577
+ </layer>
578
+ <layer id="36" name="Constant_2498529" type="Const" version="opset1">
579
+ <data element_type="i32" shape="" offset="2622076" size="4" />
580
+ <output>
581
+ <port id="0" precision="I32" />
582
+ </output>
583
+ </layer>
584
+ <layer id="37" name="ReduceMax_2498530" type="ReduceMax" version="opset1">
585
+ <data keep_dims="false" />
586
+ <input>
587
+ <port id="0" precision="I32">
588
+ <dim>-1</dim>
589
+ </port>
590
+ <port id="1" precision="I32" />
591
+ </input>
592
+ <output>
593
+ <port id="2" precision="I32" />
594
+ </output>
595
+ </layer>
596
+ <layer id="38" name="Constant_2498531" type="Const" version="opset1">
597
+ <data element_type="i32" shape="" offset="2622076" size="4" />
598
+ <output>
599
+ <port id="0" precision="I32" />
600
+ </output>
601
+ </layer>
602
+ <layer id="39" name="RaggedToDense_2498532" type="RaggedToDense" version="extension">
603
+ <data pad_right="false" />
604
+ <input>
605
+ <port id="0" precision="I32">
606
+ <dim>-1</dim>
607
+ </port>
608
+ <port id="1" precision="I32">
609
+ <dim>-1</dim>
610
+ </port>
611
+ <port id="2" precision="I32">
612
+ <dim>-1</dim>
613
+ </port>
614
+ <port id="3" precision="I32" />
615
+ <port id="4" precision="I32" />
616
+ </input>
617
+ <output>
618
+ <port id="5" precision="I32">
619
+ <dim>-1</dim>
620
+ <dim>-1</dim>
621
+ </port>
622
+ <port id="6" precision="BOOL">
623
+ <dim>-1</dim>
624
+ <dim>-1</dim>
625
+ </port>
626
+ </output>
627
+ </layer>
628
+ <layer id="40" name="Convert_2498533" type="Convert" version="opset1">
629
+ <data destination_type="i32" />
630
+ <input>
631
+ <port id="0" precision="BOOL">
632
+ <dim>-1</dim>
633
+ <dim>-1</dim>
634
+ </port>
635
+ </input>
636
+ <output>
637
+ <port id="1" precision="I32">
638
+ <dim>-1</dim>
639
+ <dim>-1</dim>
640
+ </port>
641
+ </output>
642
+ </layer>
643
+ <layer id="41" name="Convert_2498533.0" type="Convert" version="opset1">
644
+ <data destination_type="i64" />
645
+ <input>
646
+ <port id="0" precision="I32">
647
+ <dim>-1</dim>
648
+ <dim>-1</dim>
649
+ </port>
650
+ </input>
651
+ <output>
652
+ <port id="1" precision="I64" names="attention_mask">
653
+ <dim>-1</dim>
654
+ <dim>-1</dim>
655
+ </port>
656
+ </output>
657
+ </layer>
658
+ <layer id="43" name="RaggedToDense_2498532.0" type="Convert" version="opset1">
659
+ <data destination_type="i64" />
660
+ <input>
661
+ <port id="0" precision="I32">
662
+ <dim>-1</dim>
663
+ <dim>-1</dim>
664
+ </port>
665
+ </input>
666
+ <output>
667
+ <port id="1" precision="I64" names="input_ids">
668
+ <dim>-1</dim>
669
+ <dim>-1</dim>
670
+ </port>
671
+ </output>
672
+ </layer>
673
+ <layer id="44" name="Result_2498534" type="Result" version="opset1">
674
+ <input>
675
+ <port id="0" precision="I64">
676
+ <dim>-1</dim>
677
+ <dim>-1</dim>
678
+ </port>
679
+ </input>
680
+ </layer>
681
+ <layer id="42" name="Result_2498535" type="Result" version="opset1">
682
+ <input>
683
+ <port id="0" precision="I64">
684
+ <dim>-1</dim>
685
+ <dim>-1</dim>
686
+ </port>
687
+ </input>
688
+ </layer>
689
+ </layers>
690
+ <edges>
691
+ <edge from-layer="0" from-port="0" to-layer="2" to-port="0" />
692
+ <edge from-layer="1" from-port="0" to-layer="8" to-port="0" />
693
+ <edge from-layer="2" from-port="1" to-layer="3" to-port="0" />
694
+ <edge from-layer="2" from-port="3" to-layer="15" to-port="4" />
695
+ <edge from-layer="2" from-port="2" to-layer="15" to-port="3" />
696
+ <edge from-layer="2" from-port="1" to-layer="15" to-port="2" />
697
+ <edge from-layer="3" from-port="1" to-layer="6" to-port="0" />
698
+ <edge from-layer="4" from-port="0" to-layer="6" to-port="1" />
699
+ <edge from-layer="5" from-port="0" to-layer="6" to-port="2" />
700
+ <edge from-layer="6" from-port="3" to-layer="8" to-port="1" />
701
+ <edge from-layer="6" from-port="3" to-layer="11" to-port="0" />
702
+ <edge from-layer="7" from-port="0" to-layer="8" to-port="2" />
703
+ <edge from-layer="8" from-port="3" to-layer="15" to-port="0" />
704
+ <edge from-layer="9" from-port="0" to-layer="13" to-port="0" />
705
+ <edge from-layer="10" from-port="0" to-layer="11" to-port="1" />
706
+ <edge from-layer="11" from-port="2" to-layer="13" to-port="1" />
707
+ <edge from-layer="12" from-port="0" to-layer="13" to-port="2" />
708
+ <edge from-layer="13" from-port="3" to-layer="15" to-port="1" />
709
+ <edge from-layer="14" from-port="0" to-layer="15" to-port="5" />
710
+ <edge from-layer="15" from-port="8" to-layer="16" to-port="0" />
711
+ <edge from-layer="15" from-port="9" to-layer="16" to-port="1" />
712
+ <edge from-layer="15" from-port="10" to-layer="16" to-port="2" />
713
+ <edge from-layer="15" from-port="11" to-layer="16" to-port="3" />
714
+ <edge from-layer="15" from-port="6" to-layer="18" to-port="0" />
715
+ <edge from-layer="15" from-port="7" to-layer="18" to-port="1" />
716
+ <edge from-layer="16" from-port="4" to-layer="18" to-port="2" />
717
+ <edge from-layer="16" from-port="7" to-layer="18" to-port="5" />
718
+ <edge from-layer="16" from-port="5" to-layer="18" to-port="3" />
719
+ <edge from-layer="16" from-port="6" to-layer="18" to-port="4" />
720
+ <edge from-layer="17" from-port="0" to-layer="18" to-port="6" />
721
+ <edge from-layer="18" from-port="7" to-layer="20" to-port="0" />
722
+ <edge from-layer="18" from-port="8" to-layer="20" to-port="1" />
723
+ <edge from-layer="18" from-port="9" to-layer="20" to-port="2" />
724
+ <edge from-layer="18" from-port="10" to-layer="20" to-port="3" />
725
+ <edge from-layer="18" from-port="11" to-layer="20" to-port="4" />
726
+ <edge from-layer="18" from-port="12" to-layer="20" to-port="5" />
727
+ <edge from-layer="19" from-port="0" to-layer="20" to-port="6" />
728
+ <edge from-layer="20" from-port="7" to-layer="30" to-port="0" />
729
+ <edge from-layer="20" from-port="8" to-layer="30" to-port="1" />
730
+ <edge from-layer="20" from-port="9" to-layer="30" to-port="2" />
731
+ <edge from-layer="20" from-port="10" to-layer="30" to-port="3" />
732
+ <edge from-layer="20" from-port="11" to-layer="30" to-port="4" />
733
+ <edge from-layer="21" from-port="0" to-layer="22" to-port="0" />
734
+ <edge from-layer="22" from-port="2" to-layer="30" to-port="6" />
735
+ <edge from-layer="22" from-port="3" to-layer="30" to-port="7" />
736
+ <edge from-layer="22" from-port="1" to-layer="30" to-port="5" />
737
+ <edge from-layer="23" from-port="0" to-layer="24" to-port="0" />
738
+ <edge from-layer="24" from-port="1" to-layer="30" to-port="8" />
739
+ <edge from-layer="24" from-port="2" to-layer="30" to-port="9" />
740
+ <edge from-layer="24" from-port="3" to-layer="30" to-port="10" />
741
+ <edge from-layer="25" from-port="0" to-layer="26" to-port="0" />
742
+ <edge from-layer="26" from-port="1" to-layer="30" to-port="11" />
743
+ <edge from-layer="26" from-port="2" to-layer="30" to-port="12" />
744
+ <edge from-layer="26" from-port="3" to-layer="30" to-port="13" />
745
+ <edge from-layer="27" from-port="0" to-layer="28" to-port="0" />
746
+ <edge from-layer="28" from-port="1" to-layer="30" to-port="14" />
747
+ <edge from-layer="28" from-port="2" to-layer="30" to-port="15" />
748
+ <edge from-layer="28" from-port="3" to-layer="30" to-port="16" />
749
+ <edge from-layer="29" from-port="0" to-layer="30" to-port="17" />
750
+ <edge from-layer="30" from-port="19" to-layer="35" to-port="0" />
751
+ <edge from-layer="30" from-port="20" to-layer="39" to-port="2" />
752
+ <edge from-layer="30" from-port="19" to-layer="39" to-port="1" />
753
+ <edge from-layer="30" from-port="19" to-layer="34" to-port="0" />
754
+ <edge from-layer="30" from-port="18" to-layer="31" to-port="1" />
755
+ <edge from-layer="30" from-port="19" to-layer="31" to-port="0" />
756
+ <edge from-layer="31" from-port="2" to-layer="33" to-port="0" />
757
+ <edge from-layer="32" from-port="0" to-layer="33" to-port="1" />
758
+ <edge from-layer="33" from-port="2" to-layer="34" to-port="1" />
759
+ <edge from-layer="34" from-port="2" to-layer="35" to-port="1" />
760
+ <edge from-layer="34" from-port="2" to-layer="39" to-port="0" />
761
+ <edge from-layer="35" from-port="2" to-layer="37" to-port="0" />
762
+ <edge from-layer="36" from-port="0" to-layer="37" to-port="1" />
763
+ <edge from-layer="37" from-port="2" to-layer="39" to-port="3" />
764
+ <edge from-layer="38" from-port="0" to-layer="39" to-port="4" />
765
+ <edge from-layer="39" from-port="6" to-layer="40" to-port="0" />
766
+ <edge from-layer="39" from-port="5" to-layer="43" to-port="0" />
767
+ <edge from-layer="40" from-port="1" to-layer="41" to-port="0" />
768
+ <edge from-layer="41" from-port="1" to-layer="42" to-port="0" />
769
+ <edge from-layer="43" from-port="1" to-layer="44" to-port="0" />
770
+ </edges>
771
+ <rt_info>
772
+ <add_attention_mask value="True" />
773
+ <add_prefix_space />
774
+ <add_special_tokens value="True" />
775
+ <bos_token_id value="1" />
776
+ <chat_template value="{% for message in messages %}{% if loop.first and message['role'] != 'system' %}{{ '[|system|][|endofturn|]&#10;' }}{% endif %}{% set content = message['content'] %}{% if '&lt;/thought>' in content %}{% set content = content.split('&lt;/thought>')[-1].lstrip('\n') %}{% endif %}{{ '[|' + message['role'] + '|]' + content }}{% if not message['role'] == 'user' %}{{ '[|endofturn|]' }}{% endif %}{% if not loop.last %}{{ '&#10;' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '&#10;[|assistant|]&lt;thought>&#10;' }}{% endif %}" />
777
+ <clean_up_tokenization_spaces />
778
+ <detokenizer_input_type value="i64" />
779
+ <eos_token_id value="361" />
780
+ <handle_special_tokens_with_re />
781
+ <number_of_inputs value="1" />
782
+ <openvino_tokenizers_version value="2025.0.0.0" />
783
+ <openvino_version value="2025.0.0" />
784
+ <original_tokenizer_class value="&lt;class 'transformers.models.gpt2.tokenization_gpt2_fast.GPT2TokenizerFast'>" />
785
+ <pad_token_id value="0" />
786
+ <sentencepiece_version value="0.2.0" />
787
+ <skip_special_tokens value="True" />
788
+ <streaming_detokenizer value="False" />
789
+ <tiktoken_version value="0.7.0" />
790
+ <tokenizer_output_type value="i64" />
791
+ <tokenizers_version value="0.21.1" />
792
+ <transformers_version value="4.50.2" />
793
+ <use_max_padding value="False" />
794
+ <use_sentencepiece_backend value="False" />
795
+ <utf8_replace_mode value="replace" />
796
+ <with_detokenizer value="True" />
797
+ </rt_info>
798
+ </net>
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "[BOS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "[|endofturn|]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "[UNK]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,3222 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "[PAD]",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "[BOS]",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "[EOS]",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "[UNK]",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "4": {
37
+ "content": " ",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": false
43
+ },
44
+ "5": {
45
+ "content": " ",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": false
51
+ },
52
+ "6": {
53
+ "content": " ",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": false
59
+ },
60
+ "7": {
61
+ "content": " ",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": false
67
+ },
68
+ "8": {
69
+ "content": " ",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": false
75
+ },
76
+ "9": {
77
+ "content": " ",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": false
83
+ },
84
+ "10": {
85
+ "content": " ",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": false
91
+ },
92
+ "11": {
93
+ "content": " ",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": false
99
+ },
100
+ "12": {
101
+ "content": " ",
102
+ "lstrip": false,
103
+ "normalized": false,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": false
107
+ },
108
+ "13": {
109
+ "content": " ",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": false
115
+ },
116
+ "14": {
117
+ "content": " ",
118
+ "lstrip": false,
119
+ "normalized": false,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": false
123
+ },
124
+ "15": {
125
+ "content": " ",
126
+ "lstrip": false,
127
+ "normalized": false,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": false
131
+ },
132
+ "16": {
133
+ "content": " ",
134
+ "lstrip": false,
135
+ "normalized": false,
136
+ "rstrip": false,
137
+ "single_word": false,
138
+ "special": false
139
+ },
140
+ "17": {
141
+ "content": " ",
142
+ "lstrip": false,
143
+ "normalized": false,
144
+ "rstrip": false,
145
+ "single_word": false,
146
+ "special": false
147
+ },
148
+ "18": {
149
+ "content": " ",
150
+ "lstrip": false,
151
+ "normalized": false,
152
+ "rstrip": false,
153
+ "single_word": false,
154
+ "special": false
155
+ },
156
+ "19": {
157
+ "content": " ",
158
+ "lstrip": false,
159
+ "normalized": false,
160
+ "rstrip": false,
161
+ "single_word": false,
162
+ "special": false
163
+ },
164
+ "20": {
165
+ "content": " ",
166
+ "lstrip": false,
167
+ "normalized": false,
168
+ "rstrip": false,
169
+ "single_word": false,
170
+ "special": false
171
+ },
172
+ "21": {
173
+ "content": " ",
174
+ "lstrip": false,
175
+ "normalized": false,
176
+ "rstrip": false,
177
+ "single_word": false,
178
+ "special": false
179
+ },
180
+ "22": {
181
+ "content": " ",
182
+ "lstrip": false,
183
+ "normalized": false,
184
+ "rstrip": false,
185
+ "single_word": false,
186
+ "special": false
187
+ },
188
+ "23": {
189
+ "content": " ",
190
+ "lstrip": false,
191
+ "normalized": false,
192
+ "rstrip": false,
193
+ "single_word": false,
194
+ "special": false
195
+ },
196
+ "24": {
197
+ "content": " ",
198
+ "lstrip": false,
199
+ "normalized": false,
200
+ "rstrip": false,
201
+ "single_word": false,
202
+ "special": false
203
+ },
204
+ "25": {
205
+ "content": " ",
206
+ "lstrip": false,
207
+ "normalized": false,
208
+ "rstrip": false,
209
+ "single_word": false,
210
+ "special": false
211
+ },
212
+ "26": {
213
+ "content": " ",
214
+ "lstrip": false,
215
+ "normalized": false,
216
+ "rstrip": false,
217
+ "single_word": false,
218
+ "special": false
219
+ },
220
+ "27": {
221
+ "content": " ",
222
+ "lstrip": false,
223
+ "normalized": false,
224
+ "rstrip": false,
225
+ "single_word": false,
226
+ "special": false
227
+ },
228
+ "28": {
229
+ "content": " ",
230
+ "lstrip": false,
231
+ "normalized": false,
232
+ "rstrip": false,
233
+ "single_word": false,
234
+ "special": false
235
+ },
236
+ "29": {
237
+ "content": " ",
238
+ "lstrip": false,
239
+ "normalized": false,
240
+ "rstrip": false,
241
+ "single_word": false,
242
+ "special": false
243
+ },
244
+ "30": {
245
+ "content": " ",
246
+ "lstrip": false,
247
+ "normalized": false,
248
+ "rstrip": false,
249
+ "single_word": false,
250
+ "special": false
251
+ },
252
+ "31": {
253
+ "content": " ",
254
+ "lstrip": false,
255
+ "normalized": false,
256
+ "rstrip": false,
257
+ "single_word": false,
258
+ "special": false
259
+ },
260
+ "32": {
261
+ "content": " ",
262
+ "lstrip": false,
263
+ "normalized": false,
264
+ "rstrip": false,
265
+ "single_word": false,
266
+ "special": false
267
+ },
268
+ "33": {
269
+ "content": " ",
270
+ "lstrip": false,
271
+ "normalized": false,
272
+ "rstrip": false,
273
+ "single_word": false,
274
+ "special": false
275
+ },
276
+ "34": {
277
+ "content": "\t\t\t\t\t\t\t\t\t",
278
+ "lstrip": false,
279
+ "normalized": false,
280
+ "rstrip": false,
281
+ "single_word": false,
282
+ "special": false
283
+ },
284
+ "35": {
285
+ "content": "\t\t\t\t\t\t\t\t",
286
+ "lstrip": false,
287
+ "normalized": false,
288
+ "rstrip": false,
289
+ "single_word": false,
290
+ "special": false
291
+ },
292
+ "36": {
293
+ "content": "\t\t\t\t\t\t\t",
294
+ "lstrip": false,
295
+ "normalized": false,
296
+ "rstrip": false,
297
+ "single_word": false,
298
+ "special": false
299
+ },
300
+ "37": {
301
+ "content": "\t\t\t\t\t\t",
302
+ "lstrip": false,
303
+ "normalized": false,
304
+ "rstrip": false,
305
+ "single_word": false,
306
+ "special": false
307
+ },
308
+ "38": {
309
+ "content": "\t\t\t\t\t",
310
+ "lstrip": false,
311
+ "normalized": false,
312
+ "rstrip": false,
313
+ "single_word": false,
314
+ "special": false
315
+ },
316
+ "39": {
317
+ "content": "\t\t\t\t",
318
+ "lstrip": false,
319
+ "normalized": false,
320
+ "rstrip": false,
321
+ "single_word": false,
322
+ "special": false
323
+ },
324
+ "40": {
325
+ "content": "\t\t\t",
326
+ "lstrip": false,
327
+ "normalized": false,
328
+ "rstrip": false,
329
+ "single_word": false,
330
+ "special": false
331
+ },
332
+ "41": {
333
+ "content": "\t\t",
334
+ "lstrip": false,
335
+ "normalized": false,
336
+ "rstrip": false,
337
+ "single_word": false,
338
+ "special": false
339
+ },
340
+ "42": {
341
+ "content": "<|endoftext|>",
342
+ "lstrip": false,
343
+ "normalized": false,
344
+ "rstrip": false,
345
+ "single_word": false,
346
+ "special": true
347
+ },
348
+ "43": {
349
+ "content": "<|c|>",
350
+ "lstrip": false,
351
+ "normalized": false,
352
+ "rstrip": false,
353
+ "single_word": false,
354
+ "special": true
355
+ },
356
+ "44": {
357
+ "content": "<|c++|>",
358
+ "lstrip": false,
359
+ "normalized": false,
360
+ "rstrip": false,
361
+ "single_word": false,
362
+ "special": true
363
+ },
364
+ "45": {
365
+ "content": "<|python|>",
366
+ "lstrip": false,
367
+ "normalized": false,
368
+ "rstrip": false,
369
+ "single_word": false,
370
+ "special": true
371
+ },
372
+ "46": {
373
+ "content": "<|javascript|>",
374
+ "lstrip": false,
375
+ "normalized": false,
376
+ "rstrip": false,
377
+ "single_word": false,
378
+ "special": true
379
+ },
380
+ "47": {
381
+ "content": "<|markdown|>",
382
+ "lstrip": false,
383
+ "normalized": false,
384
+ "rstrip": false,
385
+ "single_word": false,
386
+ "special": true
387
+ },
388
+ "48": {
389
+ "content": "<|html|>",
390
+ "lstrip": false,
391
+ "normalized": false,
392
+ "rstrip": false,
393
+ "single_word": false,
394
+ "special": true
395
+ },
396
+ "49": {
397
+ "content": "<|css|>",
398
+ "lstrip": false,
399
+ "normalized": false,
400
+ "rstrip": false,
401
+ "single_word": false,
402
+ "special": true
403
+ },
404
+ "50": {
405
+ "content": "<|vue|>",
406
+ "lstrip": false,
407
+ "normalized": false,
408
+ "rstrip": false,
409
+ "single_word": false,
410
+ "special": true
411
+ },
412
+ "51": {
413
+ "content": "<|java|>",
414
+ "lstrip": false,
415
+ "normalized": false,
416
+ "rstrip": false,
417
+ "single_word": false,
418
+ "special": true
419
+ },
420
+ "52": {
421
+ "content": "PI:URL",
422
+ "lstrip": false,
423
+ "normalized": false,
424
+ "rstrip": false,
425
+ "single_word": false,
426
+ "special": true
427
+ },
428
+ "53": {
429
+ "content": "PI:EMAIL",
430
+ "lstrip": false,
431
+ "normalized": false,
432
+ "rstrip": false,
433
+ "single_word": false,
434
+ "special": true
435
+ },
436
+ "54": {
437
+ "content": "PI:ACCOUNT_NUM",
438
+ "lstrip": false,
439
+ "normalized": false,
440
+ "rstrip": false,
441
+ "single_word": false,
442
+ "special": true
443
+ },
444
+ "55": {
445
+ "content": "PI:PHONE_NUM",
446
+ "lstrip": false,
447
+ "normalized": false,
448
+ "rstrip": false,
449
+ "single_word": false,
450
+ "special": true
451
+ },
452
+ "56": {
453
+ "content": "PI:BUSINESS_NUM",
454
+ "lstrip": false,
455
+ "normalized": false,
456
+ "rstrip": false,
457
+ "single_word": false,
458
+ "special": true
459
+ },
460
+ "57": {
461
+ "content": "PI:ANNON",
462
+ "lstrip": false,
463
+ "normalized": false,
464
+ "rstrip": false,
465
+ "single_word": false,
466
+ "special": true
467
+ },
468
+ "58": {
469
+ "content": "PI:KEY",
470
+ "lstrip": false,
471
+ "normalized": false,
472
+ "rstrip": false,
473
+ "single_word": false,
474
+ "special": true
475
+ },
476
+ "59": {
477
+ "content": "PI:ID",
478
+ "lstrip": false,
479
+ "normalized": false,
480
+ "rstrip": false,
481
+ "single_word": false,
482
+ "special": true
483
+ },
484
+ "60": {
485
+ "content": "PI:IP_ADDRESS",
486
+ "lstrip": false,
487
+ "normalized": false,
488
+ "rstrip": false,
489
+ "single_word": false,
490
+ "special": true
491
+ },
492
+ "61": {
493
+ "content": "PI:USER",
494
+ "lstrip": false,
495
+ "normalized": false,
496
+ "rstrip": false,
497
+ "single_word": false,
498
+ "special": true
499
+ },
500
+ "62": {
501
+ "content": "[unused0]",
502
+ "lstrip": false,
503
+ "normalized": false,
504
+ "rstrip": false,
505
+ "single_word": false,
506
+ "special": true
507
+ },
508
+ "63": {
509
+ "content": "[unused1]",
510
+ "lstrip": false,
511
+ "normalized": false,
512
+ "rstrip": false,
513
+ "single_word": false,
514
+ "special": true
515
+ },
516
+ "64": {
517
+ "content": "[unused2]",
518
+ "lstrip": false,
519
+ "normalized": false,
520
+ "rstrip": false,
521
+ "single_word": false,
522
+ "special": true
523
+ },
524
+ "65": {
525
+ "content": "[unused3]",
526
+ "lstrip": false,
527
+ "normalized": false,
528
+ "rstrip": false,
529
+ "single_word": false,
530
+ "special": true
531
+ },
532
+ "66": {
533
+ "content": "[unused4]",
534
+ "lstrip": false,
535
+ "normalized": false,
536
+ "rstrip": false,
537
+ "single_word": false,
538
+ "special": true
539
+ },
540
+ "67": {
541
+ "content": "[unused5]",
542
+ "lstrip": false,
543
+ "normalized": false,
544
+ "rstrip": false,
545
+ "single_word": false,
546
+ "special": true
547
+ },
548
+ "68": {
549
+ "content": "[unused6]",
550
+ "lstrip": false,
551
+ "normalized": false,
552
+ "rstrip": false,
553
+ "single_word": false,
554
+ "special": true
555
+ },
556
+ "69": {
557
+ "content": "[unused7]",
558
+ "lstrip": false,
559
+ "normalized": false,
560
+ "rstrip": false,
561
+ "single_word": false,
562
+ "special": true
563
+ },
564
+ "70": {
565
+ "content": "[unused8]",
566
+ "lstrip": false,
567
+ "normalized": false,
568
+ "rstrip": false,
569
+ "single_word": false,
570
+ "special": true
571
+ },
572
+ "71": {
573
+ "content": "[unused9]",
574
+ "lstrip": false,
575
+ "normalized": false,
576
+ "rstrip": false,
577
+ "single_word": false,
578
+ "special": true
579
+ },
580
+ "72": {
581
+ "content": "[unused10]",
582
+ "lstrip": false,
583
+ "normalized": false,
584
+ "rstrip": false,
585
+ "single_word": false,
586
+ "special": true
587
+ },
588
+ "73": {
589
+ "content": "[unused11]",
590
+ "lstrip": false,
591
+ "normalized": false,
592
+ "rstrip": false,
593
+ "single_word": false,
594
+ "special": true
595
+ },
596
+ "74": {
597
+ "content": "[unused12]",
598
+ "lstrip": false,
599
+ "normalized": false,
600
+ "rstrip": false,
601
+ "single_word": false,
602
+ "special": true
603
+ },
604
+ "75": {
605
+ "content": "[unused13]",
606
+ "lstrip": false,
607
+ "normalized": false,
608
+ "rstrip": false,
609
+ "single_word": false,
610
+ "special": true
611
+ },
612
+ "76": {
613
+ "content": "[unused14]",
614
+ "lstrip": false,
615
+ "normalized": false,
616
+ "rstrip": false,
617
+ "single_word": false,
618
+ "special": true
619
+ },
620
+ "77": {
621
+ "content": "[unused15]",
622
+ "lstrip": false,
623
+ "normalized": false,
624
+ "rstrip": false,
625
+ "single_word": false,
626
+ "special": true
627
+ },
628
+ "78": {
629
+ "content": "[unused16]",
630
+ "lstrip": false,
631
+ "normalized": false,
632
+ "rstrip": false,
633
+ "single_word": false,
634
+ "special": true
635
+ },
636
+ "79": {
637
+ "content": "[unused17]",
638
+ "lstrip": false,
639
+ "normalized": false,
640
+ "rstrip": false,
641
+ "single_word": false,
642
+ "special": true
643
+ },
644
+ "80": {
645
+ "content": "[unused18]",
646
+ "lstrip": false,
647
+ "normalized": false,
648
+ "rstrip": false,
649
+ "single_word": false,
650
+ "special": true
651
+ },
652
+ "81": {
653
+ "content": "[unused19]",
654
+ "lstrip": false,
655
+ "normalized": false,
656
+ "rstrip": false,
657
+ "single_word": false,
658
+ "special": true
659
+ },
660
+ "82": {
661
+ "content": "[unused20]",
662
+ "lstrip": false,
663
+ "normalized": false,
664
+ "rstrip": false,
665
+ "single_word": false,
666
+ "special": true
667
+ },
668
+ "83": {
669
+ "content": "[unused21]",
670
+ "lstrip": false,
671
+ "normalized": false,
672
+ "rstrip": false,
673
+ "single_word": false,
674
+ "special": true
675
+ },
676
+ "84": {
677
+ "content": "[unused22]",
678
+ "lstrip": false,
679
+ "normalized": false,
680
+ "rstrip": false,
681
+ "single_word": false,
682
+ "special": true
683
+ },
684
+ "85": {
685
+ "content": "[unused23]",
686
+ "lstrip": false,
687
+ "normalized": false,
688
+ "rstrip": false,
689
+ "single_word": false,
690
+ "special": true
691
+ },
692
+ "86": {
693
+ "content": "[unused24]",
694
+ "lstrip": false,
695
+ "normalized": false,
696
+ "rstrip": false,
697
+ "single_word": false,
698
+ "special": true
699
+ },
700
+ "87": {
701
+ "content": "[unused25]",
702
+ "lstrip": false,
703
+ "normalized": false,
704
+ "rstrip": false,
705
+ "single_word": false,
706
+ "special": true
707
+ },
708
+ "88": {
709
+ "content": "[unused26]",
710
+ "lstrip": false,
711
+ "normalized": false,
712
+ "rstrip": false,
713
+ "single_word": false,
714
+ "special": true
715
+ },
716
+ "89": {
717
+ "content": "[unused27]",
718
+ "lstrip": false,
719
+ "normalized": false,
720
+ "rstrip": false,
721
+ "single_word": false,
722
+ "special": true
723
+ },
724
+ "90": {
725
+ "content": "[unused28]",
726
+ "lstrip": false,
727
+ "normalized": false,
728
+ "rstrip": false,
729
+ "single_word": false,
730
+ "special": true
731
+ },
732
+ "91": {
733
+ "content": "[unused29]",
734
+ "lstrip": false,
735
+ "normalized": false,
736
+ "rstrip": false,
737
+ "single_word": false,
738
+ "special": true
739
+ },
740
+ "92": {
741
+ "content": "[unused30]",
742
+ "lstrip": false,
743
+ "normalized": false,
744
+ "rstrip": false,
745
+ "single_word": false,
746
+ "special": true
747
+ },
748
+ "93": {
749
+ "content": "[unused31]",
750
+ "lstrip": false,
751
+ "normalized": false,
752
+ "rstrip": false,
753
+ "single_word": false,
754
+ "special": true
755
+ },
756
+ "94": {
757
+ "content": "[unused32]",
758
+ "lstrip": false,
759
+ "normalized": false,
760
+ "rstrip": false,
761
+ "single_word": false,
762
+ "special": true
763
+ },
764
+ "95": {
765
+ "content": "[unused33]",
766
+ "lstrip": false,
767
+ "normalized": false,
768
+ "rstrip": false,
769
+ "single_word": false,
770
+ "special": true
771
+ },
772
+ "96": {
773
+ "content": "[unused34]",
774
+ "lstrip": false,
775
+ "normalized": false,
776
+ "rstrip": false,
777
+ "single_word": false,
778
+ "special": true
779
+ },
780
+ "97": {
781
+ "content": "[unused35]",
782
+ "lstrip": false,
783
+ "normalized": false,
784
+ "rstrip": false,
785
+ "single_word": false,
786
+ "special": true
787
+ },
788
+ "98": {
789
+ "content": "[unused36]",
790
+ "lstrip": false,
791
+ "normalized": false,
792
+ "rstrip": false,
793
+ "single_word": false,
794
+ "special": true
795
+ },
796
+ "99": {
797
+ "content": "[unused37]",
798
+ "lstrip": false,
799
+ "normalized": false,
800
+ "rstrip": false,
801
+ "single_word": false,
802
+ "special": true
803
+ },
804
+ "100": {
805
+ "content": "[unused38]",
806
+ "lstrip": false,
807
+ "normalized": false,
808
+ "rstrip": false,
809
+ "single_word": false,
810
+ "special": true
811
+ },
812
+ "101": {
813
+ "content": "[unused39]",
814
+ "lstrip": false,
815
+ "normalized": false,
816
+ "rstrip": false,
817
+ "single_word": false,
818
+ "special": true
819
+ },
820
+ "102": {
821
+ "content": "[unused40]",
822
+ "lstrip": false,
823
+ "normalized": false,
824
+ "rstrip": false,
825
+ "single_word": false,
826
+ "special": true
827
+ },
828
+ "103": {
829
+ "content": "[unused41]",
830
+ "lstrip": false,
831
+ "normalized": false,
832
+ "rstrip": false,
833
+ "single_word": false,
834
+ "special": true
835
+ },
836
+ "104": {
837
+ "content": "[unused42]",
838
+ "lstrip": false,
839
+ "normalized": false,
840
+ "rstrip": false,
841
+ "single_word": false,
842
+ "special": true
843
+ },
844
+ "105": {
845
+ "content": "[unused43]",
846
+ "lstrip": false,
847
+ "normalized": false,
848
+ "rstrip": false,
849
+ "single_word": false,
850
+ "special": true
851
+ },
852
+ "106": {
853
+ "content": "[unused44]",
854
+ "lstrip": false,
855
+ "normalized": false,
856
+ "rstrip": false,
857
+ "single_word": false,
858
+ "special": true
859
+ },
860
+ "107": {
861
+ "content": "[unused45]",
862
+ "lstrip": false,
863
+ "normalized": false,
864
+ "rstrip": false,
865
+ "single_word": false,
866
+ "special": true
867
+ },
868
+ "108": {
869
+ "content": "[unused46]",
870
+ "lstrip": false,
871
+ "normalized": false,
872
+ "rstrip": false,
873
+ "single_word": false,
874
+ "special": true
875
+ },
876
+ "109": {
877
+ "content": "[unused47]",
878
+ "lstrip": false,
879
+ "normalized": false,
880
+ "rstrip": false,
881
+ "single_word": false,
882
+ "special": true
883
+ },
884
+ "110": {
885
+ "content": "[unused48]",
886
+ "lstrip": false,
887
+ "normalized": false,
888
+ "rstrip": false,
889
+ "single_word": false,
890
+ "special": true
891
+ },
892
+ "111": {
893
+ "content": "[unused49]",
894
+ "lstrip": false,
895
+ "normalized": false,
896
+ "rstrip": false,
897
+ "single_word": false,
898
+ "special": true
899
+ },
900
+ "112": {
901
+ "content": "[unused50]",
902
+ "lstrip": false,
903
+ "normalized": false,
904
+ "rstrip": false,
905
+ "single_word": false,
906
+ "special": true
907
+ },
908
+ "113": {
909
+ "content": "[unused51]",
910
+ "lstrip": false,
911
+ "normalized": false,
912
+ "rstrip": false,
913
+ "single_word": false,
914
+ "special": true
915
+ },
916
+ "114": {
917
+ "content": "[unused52]",
918
+ "lstrip": false,
919
+ "normalized": false,
920
+ "rstrip": false,
921
+ "single_word": false,
922
+ "special": true
923
+ },
924
+ "115": {
925
+ "content": "[unused53]",
926
+ "lstrip": false,
927
+ "normalized": false,
928
+ "rstrip": false,
929
+ "single_word": false,
930
+ "special": true
931
+ },
932
+ "116": {
933
+ "content": "[unused54]",
934
+ "lstrip": false,
935
+ "normalized": false,
936
+ "rstrip": false,
937
+ "single_word": false,
938
+ "special": true
939
+ },
940
+ "117": {
941
+ "content": "[unused55]",
942
+ "lstrip": false,
943
+ "normalized": false,
944
+ "rstrip": false,
945
+ "single_word": false,
946
+ "special": true
947
+ },
948
+ "118": {
949
+ "content": "[unused56]",
950
+ "lstrip": false,
951
+ "normalized": false,
952
+ "rstrip": false,
953
+ "single_word": false,
954
+ "special": true
955
+ },
956
+ "119": {
957
+ "content": "[unused57]",
958
+ "lstrip": false,
959
+ "normalized": false,
960
+ "rstrip": false,
961
+ "single_word": false,
962
+ "special": true
963
+ },
964
+ "120": {
965
+ "content": "[unused58]",
966
+ "lstrip": false,
967
+ "normalized": false,
968
+ "rstrip": false,
969
+ "single_word": false,
970
+ "special": true
971
+ },
972
+ "121": {
973
+ "content": "[unused59]",
974
+ "lstrip": false,
975
+ "normalized": false,
976
+ "rstrip": false,
977
+ "single_word": false,
978
+ "special": true
979
+ },
980
+ "122": {
981
+ "content": "[unused60]",
982
+ "lstrip": false,
983
+ "normalized": false,
984
+ "rstrip": false,
985
+ "single_word": false,
986
+ "special": true
987
+ },
988
+ "123": {
989
+ "content": "[unused61]",
990
+ "lstrip": false,
991
+ "normalized": false,
992
+ "rstrip": false,
993
+ "single_word": false,
994
+ "special": true
995
+ },
996
+ "124": {
997
+ "content": "[unused62]",
998
+ "lstrip": false,
999
+ "normalized": false,
1000
+ "rstrip": false,
1001
+ "single_word": false,
1002
+ "special": true
1003
+ },
1004
+ "125": {
1005
+ "content": "[unused63]",
1006
+ "lstrip": false,
1007
+ "normalized": false,
1008
+ "rstrip": false,
1009
+ "single_word": false,
1010
+ "special": true
1011
+ },
1012
+ "126": {
1013
+ "content": "[unused64]",
1014
+ "lstrip": false,
1015
+ "normalized": false,
1016
+ "rstrip": false,
1017
+ "single_word": false,
1018
+ "special": true
1019
+ },
1020
+ "127": {
1021
+ "content": "[unused65]",
1022
+ "lstrip": false,
1023
+ "normalized": false,
1024
+ "rstrip": false,
1025
+ "single_word": false,
1026
+ "special": true
1027
+ },
1028
+ "128": {
1029
+ "content": "[unused66]",
1030
+ "lstrip": false,
1031
+ "normalized": false,
1032
+ "rstrip": false,
1033
+ "single_word": false,
1034
+ "special": true
1035
+ },
1036
+ "129": {
1037
+ "content": "[unused67]",
1038
+ "lstrip": false,
1039
+ "normalized": false,
1040
+ "rstrip": false,
1041
+ "single_word": false,
1042
+ "special": true
1043
+ },
1044
+ "130": {
1045
+ "content": "[unused68]",
1046
+ "lstrip": false,
1047
+ "normalized": false,
1048
+ "rstrip": false,
1049
+ "single_word": false,
1050
+ "special": true
1051
+ },
1052
+ "131": {
1053
+ "content": "[unused69]",
1054
+ "lstrip": false,
1055
+ "normalized": false,
1056
+ "rstrip": false,
1057
+ "single_word": false,
1058
+ "special": true
1059
+ },
1060
+ "132": {
1061
+ "content": "[unused70]",
1062
+ "lstrip": false,
1063
+ "normalized": false,
1064
+ "rstrip": false,
1065
+ "single_word": false,
1066
+ "special": true
1067
+ },
1068
+ "133": {
1069
+ "content": "[unused71]",
1070
+ "lstrip": false,
1071
+ "normalized": false,
1072
+ "rstrip": false,
1073
+ "single_word": false,
1074
+ "special": true
1075
+ },
1076
+ "134": {
1077
+ "content": "[unused72]",
1078
+ "lstrip": false,
1079
+ "normalized": false,
1080
+ "rstrip": false,
1081
+ "single_word": false,
1082
+ "special": true
1083
+ },
1084
+ "135": {
1085
+ "content": "[unused73]",
1086
+ "lstrip": false,
1087
+ "normalized": false,
1088
+ "rstrip": false,
1089
+ "single_word": false,
1090
+ "special": true
1091
+ },
1092
+ "136": {
1093
+ "content": "[unused74]",
1094
+ "lstrip": false,
1095
+ "normalized": false,
1096
+ "rstrip": false,
1097
+ "single_word": false,
1098
+ "special": true
1099
+ },
1100
+ "137": {
1101
+ "content": "[unused75]",
1102
+ "lstrip": false,
1103
+ "normalized": false,
1104
+ "rstrip": false,
1105
+ "single_word": false,
1106
+ "special": true
1107
+ },
1108
+ "138": {
1109
+ "content": "[unused76]",
1110
+ "lstrip": false,
1111
+ "normalized": false,
1112
+ "rstrip": false,
1113
+ "single_word": false,
1114
+ "special": true
1115
+ },
1116
+ "139": {
1117
+ "content": "[unused77]",
1118
+ "lstrip": false,
1119
+ "normalized": false,
1120
+ "rstrip": false,
1121
+ "single_word": false,
1122
+ "special": true
1123
+ },
1124
+ "140": {
1125
+ "content": "[unused78]",
1126
+ "lstrip": false,
1127
+ "normalized": false,
1128
+ "rstrip": false,
1129
+ "single_word": false,
1130
+ "special": true
1131
+ },
1132
+ "141": {
1133
+ "content": "[unused79]",
1134
+ "lstrip": false,
1135
+ "normalized": false,
1136
+ "rstrip": false,
1137
+ "single_word": false,
1138
+ "special": true
1139
+ },
1140
+ "142": {
1141
+ "content": "[unused80]",
1142
+ "lstrip": false,
1143
+ "normalized": false,
1144
+ "rstrip": false,
1145
+ "single_word": false,
1146
+ "special": true
1147
+ },
1148
+ "143": {
1149
+ "content": "[unused81]",
1150
+ "lstrip": false,
1151
+ "normalized": false,
1152
+ "rstrip": false,
1153
+ "single_word": false,
1154
+ "special": true
1155
+ },
1156
+ "144": {
1157
+ "content": "[unused82]",
1158
+ "lstrip": false,
1159
+ "normalized": false,
1160
+ "rstrip": false,
1161
+ "single_word": false,
1162
+ "special": true
1163
+ },
1164
+ "145": {
1165
+ "content": "[unused83]",
1166
+ "lstrip": false,
1167
+ "normalized": false,
1168
+ "rstrip": false,
1169
+ "single_word": false,
1170
+ "special": true
1171
+ },
1172
+ "146": {
1173
+ "content": "[unused84]",
1174
+ "lstrip": false,
1175
+ "normalized": false,
1176
+ "rstrip": false,
1177
+ "single_word": false,
1178
+ "special": true
1179
+ },
1180
+ "147": {
1181
+ "content": "[unused85]",
1182
+ "lstrip": false,
1183
+ "normalized": false,
1184
+ "rstrip": false,
1185
+ "single_word": false,
1186
+ "special": true
1187
+ },
1188
+ "148": {
1189
+ "content": "[unused86]",
1190
+ "lstrip": false,
1191
+ "normalized": false,
1192
+ "rstrip": false,
1193
+ "single_word": false,
1194
+ "special": true
1195
+ },
1196
+ "149": {
1197
+ "content": "[unused87]",
1198
+ "lstrip": false,
1199
+ "normalized": false,
1200
+ "rstrip": false,
1201
+ "single_word": false,
1202
+ "special": true
1203
+ },
1204
+ "150": {
1205
+ "content": "[unused88]",
1206
+ "lstrip": false,
1207
+ "normalized": false,
1208
+ "rstrip": false,
1209
+ "single_word": false,
1210
+ "special": true
1211
+ },
1212
+ "151": {
1213
+ "content": "[unused89]",
1214
+ "lstrip": false,
1215
+ "normalized": false,
1216
+ "rstrip": false,
1217
+ "single_word": false,
1218
+ "special": true
1219
+ },
1220
+ "152": {
1221
+ "content": "[unused90]",
1222
+ "lstrip": false,
1223
+ "normalized": false,
1224
+ "rstrip": false,
1225
+ "single_word": false,
1226
+ "special": true
1227
+ },
1228
+ "153": {
1229
+ "content": "[unused91]",
1230
+ "lstrip": false,
1231
+ "normalized": false,
1232
+ "rstrip": false,
1233
+ "single_word": false,
1234
+ "special": true
1235
+ },
1236
+ "154": {
1237
+ "content": "[unused92]",
1238
+ "lstrip": false,
1239
+ "normalized": false,
1240
+ "rstrip": false,
1241
+ "single_word": false,
1242
+ "special": true
1243
+ },
1244
+ "155": {
1245
+ "content": "[unused93]",
1246
+ "lstrip": false,
1247
+ "normalized": false,
1248
+ "rstrip": false,
1249
+ "single_word": false,
1250
+ "special": true
1251
+ },
1252
+ "156": {
1253
+ "content": "[unused94]",
1254
+ "lstrip": false,
1255
+ "normalized": false,
1256
+ "rstrip": false,
1257
+ "single_word": false,
1258
+ "special": true
1259
+ },
1260
+ "157": {
1261
+ "content": "[unused95]",
1262
+ "lstrip": false,
1263
+ "normalized": false,
1264
+ "rstrip": false,
1265
+ "single_word": false,
1266
+ "special": true
1267
+ },
1268
+ "158": {
1269
+ "content": "[unused96]",
1270
+ "lstrip": false,
1271
+ "normalized": false,
1272
+ "rstrip": false,
1273
+ "single_word": false,
1274
+ "special": true
1275
+ },
1276
+ "159": {
1277
+ "content": "[unused97]",
1278
+ "lstrip": false,
1279
+ "normalized": false,
1280
+ "rstrip": false,
1281
+ "single_word": false,
1282
+ "special": true
1283
+ },
1284
+ "160": {
1285
+ "content": "[unused98]",
1286
+ "lstrip": false,
1287
+ "normalized": false,
1288
+ "rstrip": false,
1289
+ "single_word": false,
1290
+ "special": true
1291
+ },
1292
+ "161": {
1293
+ "content": "[unused99]",
1294
+ "lstrip": false,
1295
+ "normalized": false,
1296
+ "rstrip": false,
1297
+ "single_word": false,
1298
+ "special": true
1299
+ },
1300
+ "162": {
1301
+ "content": "[extra_id_0]",
1302
+ "lstrip": false,
1303
+ "normalized": false,
1304
+ "rstrip": false,
1305
+ "single_word": false,
1306
+ "special": true
1307
+ },
1308
+ "163": {
1309
+ "content": "[extra_id_1]",
1310
+ "lstrip": false,
1311
+ "normalized": false,
1312
+ "rstrip": false,
1313
+ "single_word": false,
1314
+ "special": true
1315
+ },
1316
+ "164": {
1317
+ "content": "[extra_id_2]",
1318
+ "lstrip": false,
1319
+ "normalized": false,
1320
+ "rstrip": false,
1321
+ "single_word": false,
1322
+ "special": true
1323
+ },
1324
+ "165": {
1325
+ "content": "[extra_id_3]",
1326
+ "lstrip": false,
1327
+ "normalized": false,
1328
+ "rstrip": false,
1329
+ "single_word": false,
1330
+ "special": true
1331
+ },
1332
+ "166": {
1333
+ "content": "[extra_id_4]",
1334
+ "lstrip": false,
1335
+ "normalized": false,
1336
+ "rstrip": false,
1337
+ "single_word": false,
1338
+ "special": true
1339
+ },
1340
+ "167": {
1341
+ "content": "[extra_id_5]",
1342
+ "lstrip": false,
1343
+ "normalized": false,
1344
+ "rstrip": false,
1345
+ "single_word": false,
1346
+ "special": true
1347
+ },
1348
+ "168": {
1349
+ "content": "[extra_id_6]",
1350
+ "lstrip": false,
1351
+ "normalized": false,
1352
+ "rstrip": false,
1353
+ "single_word": false,
1354
+ "special": true
1355
+ },
1356
+ "169": {
1357
+ "content": "[extra_id_7]",
1358
+ "lstrip": false,
1359
+ "normalized": false,
1360
+ "rstrip": false,
1361
+ "single_word": false,
1362
+ "special": true
1363
+ },
1364
+ "170": {
1365
+ "content": "[extra_id_8]",
1366
+ "lstrip": false,
1367
+ "normalized": false,
1368
+ "rstrip": false,
1369
+ "single_word": false,
1370
+ "special": true
1371
+ },
1372
+ "171": {
1373
+ "content": "[extra_id_9]",
1374
+ "lstrip": false,
1375
+ "normalized": false,
1376
+ "rstrip": false,
1377
+ "single_word": false,
1378
+ "special": true
1379
+ },
1380
+ "172": {
1381
+ "content": "[extra_id_10]",
1382
+ "lstrip": false,
1383
+ "normalized": false,
1384
+ "rstrip": false,
1385
+ "single_word": false,
1386
+ "special": true
1387
+ },
1388
+ "173": {
1389
+ "content": "[extra_id_11]",
1390
+ "lstrip": false,
1391
+ "normalized": false,
1392
+ "rstrip": false,
1393
+ "single_word": false,
1394
+ "special": true
1395
+ },
1396
+ "174": {
1397
+ "content": "[extra_id_12]",
1398
+ "lstrip": false,
1399
+ "normalized": false,
1400
+ "rstrip": false,
1401
+ "single_word": false,
1402
+ "special": true
1403
+ },
1404
+ "175": {
1405
+ "content": "[extra_id_13]",
1406
+ "lstrip": false,
1407
+ "normalized": false,
1408
+ "rstrip": false,
1409
+ "single_word": false,
1410
+ "special": true
1411
+ },
1412
+ "176": {
1413
+ "content": "[extra_id_14]",
1414
+ "lstrip": false,
1415
+ "normalized": false,
1416
+ "rstrip": false,
1417
+ "single_word": false,
1418
+ "special": true
1419
+ },
1420
+ "177": {
1421
+ "content": "[extra_id_15]",
1422
+ "lstrip": false,
1423
+ "normalized": false,
1424
+ "rstrip": false,
1425
+ "single_word": false,
1426
+ "special": true
1427
+ },
1428
+ "178": {
1429
+ "content": "[extra_id_16]",
1430
+ "lstrip": false,
1431
+ "normalized": false,
1432
+ "rstrip": false,
1433
+ "single_word": false,
1434
+ "special": true
1435
+ },
1436
+ "179": {
1437
+ "content": "[extra_id_17]",
1438
+ "lstrip": false,
1439
+ "normalized": false,
1440
+ "rstrip": false,
1441
+ "single_word": false,
1442
+ "special": true
1443
+ },
1444
+ "180": {
1445
+ "content": "[extra_id_18]",
1446
+ "lstrip": false,
1447
+ "normalized": false,
1448
+ "rstrip": false,
1449
+ "single_word": false,
1450
+ "special": true
1451
+ },
1452
+ "181": {
1453
+ "content": "[extra_id_19]",
1454
+ "lstrip": false,
1455
+ "normalized": false,
1456
+ "rstrip": false,
1457
+ "single_word": false,
1458
+ "special": true
1459
+ },
1460
+ "182": {
1461
+ "content": "[extra_id_20]",
1462
+ "lstrip": false,
1463
+ "normalized": false,
1464
+ "rstrip": false,
1465
+ "single_word": false,
1466
+ "special": true
1467
+ },
1468
+ "183": {
1469
+ "content": "[extra_id_21]",
1470
+ "lstrip": false,
1471
+ "normalized": false,
1472
+ "rstrip": false,
1473
+ "single_word": false,
1474
+ "special": true
1475
+ },
1476
+ "184": {
1477
+ "content": "[extra_id_22]",
1478
+ "lstrip": false,
1479
+ "normalized": false,
1480
+ "rstrip": false,
1481
+ "single_word": false,
1482
+ "special": true
1483
+ },
1484
+ "185": {
1485
+ "content": "[extra_id_23]",
1486
+ "lstrip": false,
1487
+ "normalized": false,
1488
+ "rstrip": false,
1489
+ "single_word": false,
1490
+ "special": true
1491
+ },
1492
+ "186": {
1493
+ "content": "[extra_id_24]",
1494
+ "lstrip": false,
1495
+ "normalized": false,
1496
+ "rstrip": false,
1497
+ "single_word": false,
1498
+ "special": true
1499
+ },
1500
+ "187": {
1501
+ "content": "[extra_id_25]",
1502
+ "lstrip": false,
1503
+ "normalized": false,
1504
+ "rstrip": false,
1505
+ "single_word": false,
1506
+ "special": true
1507
+ },
1508
+ "188": {
1509
+ "content": "[extra_id_26]",
1510
+ "lstrip": false,
1511
+ "normalized": false,
1512
+ "rstrip": false,
1513
+ "single_word": false,
1514
+ "special": true
1515
+ },
1516
+ "189": {
1517
+ "content": "[extra_id_27]",
1518
+ "lstrip": false,
1519
+ "normalized": false,
1520
+ "rstrip": false,
1521
+ "single_word": false,
1522
+ "special": true
1523
+ },
1524
+ "190": {
1525
+ "content": "[extra_id_28]",
1526
+ "lstrip": false,
1527
+ "normalized": false,
1528
+ "rstrip": false,
1529
+ "single_word": false,
1530
+ "special": true
1531
+ },
1532
+ "191": {
1533
+ "content": "[extra_id_29]",
1534
+ "lstrip": false,
1535
+ "normalized": false,
1536
+ "rstrip": false,
1537
+ "single_word": false,
1538
+ "special": true
1539
+ },
1540
+ "192": {
1541
+ "content": "[extra_id_30]",
1542
+ "lstrip": false,
1543
+ "normalized": false,
1544
+ "rstrip": false,
1545
+ "single_word": false,
1546
+ "special": true
1547
+ },
1548
+ "193": {
1549
+ "content": "[extra_id_31]",
1550
+ "lstrip": false,
1551
+ "normalized": false,
1552
+ "rstrip": false,
1553
+ "single_word": false,
1554
+ "special": true
1555
+ },
1556
+ "194": {
1557
+ "content": "[extra_id_32]",
1558
+ "lstrip": false,
1559
+ "normalized": false,
1560
+ "rstrip": false,
1561
+ "single_word": false,
1562
+ "special": true
1563
+ },
1564
+ "195": {
1565
+ "content": "[extra_id_33]",
1566
+ "lstrip": false,
1567
+ "normalized": false,
1568
+ "rstrip": false,
1569
+ "single_word": false,
1570
+ "special": true
1571
+ },
1572
+ "196": {
1573
+ "content": "[extra_id_34]",
1574
+ "lstrip": false,
1575
+ "normalized": false,
1576
+ "rstrip": false,
1577
+ "single_word": false,
1578
+ "special": true
1579
+ },
1580
+ "197": {
1581
+ "content": "[extra_id_35]",
1582
+ "lstrip": false,
1583
+ "normalized": false,
1584
+ "rstrip": false,
1585
+ "single_word": false,
1586
+ "special": true
1587
+ },
1588
+ "198": {
1589
+ "content": "[extra_id_36]",
1590
+ "lstrip": false,
1591
+ "normalized": false,
1592
+ "rstrip": false,
1593
+ "single_word": false,
1594
+ "special": true
1595
+ },
1596
+ "199": {
1597
+ "content": "[extra_id_37]",
1598
+ "lstrip": false,
1599
+ "normalized": false,
1600
+ "rstrip": false,
1601
+ "single_word": false,
1602
+ "special": true
1603
+ },
1604
+ "200": {
1605
+ "content": "[extra_id_38]",
1606
+ "lstrip": false,
1607
+ "normalized": false,
1608
+ "rstrip": false,
1609
+ "single_word": false,
1610
+ "special": true
1611
+ },
1612
+ "201": {
1613
+ "content": "[extra_id_39]",
1614
+ "lstrip": false,
1615
+ "normalized": false,
1616
+ "rstrip": false,
1617
+ "single_word": false,
1618
+ "special": true
1619
+ },
1620
+ "202": {
1621
+ "content": "[extra_id_40]",
1622
+ "lstrip": false,
1623
+ "normalized": false,
1624
+ "rstrip": false,
1625
+ "single_word": false,
1626
+ "special": true
1627
+ },
1628
+ "203": {
1629
+ "content": "[extra_id_41]",
1630
+ "lstrip": false,
1631
+ "normalized": false,
1632
+ "rstrip": false,
1633
+ "single_word": false,
1634
+ "special": true
1635
+ },
1636
+ "204": {
1637
+ "content": "[extra_id_42]",
1638
+ "lstrip": false,
1639
+ "normalized": false,
1640
+ "rstrip": false,
1641
+ "single_word": false,
1642
+ "special": true
1643
+ },
1644
+ "205": {
1645
+ "content": "[extra_id_43]",
1646
+ "lstrip": false,
1647
+ "normalized": false,
1648
+ "rstrip": false,
1649
+ "single_word": false,
1650
+ "special": true
1651
+ },
1652
+ "206": {
1653
+ "content": "[extra_id_44]",
1654
+ "lstrip": false,
1655
+ "normalized": false,
1656
+ "rstrip": false,
1657
+ "single_word": false,
1658
+ "special": true
1659
+ },
1660
+ "207": {
1661
+ "content": "[extra_id_45]",
1662
+ "lstrip": false,
1663
+ "normalized": false,
1664
+ "rstrip": false,
1665
+ "single_word": false,
1666
+ "special": true
1667
+ },
1668
+ "208": {
1669
+ "content": "[extra_id_46]",
1670
+ "lstrip": false,
1671
+ "normalized": false,
1672
+ "rstrip": false,
1673
+ "single_word": false,
1674
+ "special": true
1675
+ },
1676
+ "209": {
1677
+ "content": "[extra_id_47]",
1678
+ "lstrip": false,
1679
+ "normalized": false,
1680
+ "rstrip": false,
1681
+ "single_word": false,
1682
+ "special": true
1683
+ },
1684
+ "210": {
1685
+ "content": "[extra_id_48]",
1686
+ "lstrip": false,
1687
+ "normalized": false,
1688
+ "rstrip": false,
1689
+ "single_word": false,
1690
+ "special": true
1691
+ },
1692
+ "211": {
1693
+ "content": "[extra_id_49]",
1694
+ "lstrip": false,
1695
+ "normalized": false,
1696
+ "rstrip": false,
1697
+ "single_word": false,
1698
+ "special": true
1699
+ },
1700
+ "212": {
1701
+ "content": "[extra_id_50]",
1702
+ "lstrip": false,
1703
+ "normalized": false,
1704
+ "rstrip": false,
1705
+ "single_word": false,
1706
+ "special": true
1707
+ },
1708
+ "213": {
1709
+ "content": "[extra_id_51]",
1710
+ "lstrip": false,
1711
+ "normalized": false,
1712
+ "rstrip": false,
1713
+ "single_word": false,
1714
+ "special": true
1715
+ },
1716
+ "214": {
1717
+ "content": "[extra_id_52]",
1718
+ "lstrip": false,
1719
+ "normalized": false,
1720
+ "rstrip": false,
1721
+ "single_word": false,
1722
+ "special": true
1723
+ },
1724
+ "215": {
1725
+ "content": "[extra_id_53]",
1726
+ "lstrip": false,
1727
+ "normalized": false,
1728
+ "rstrip": false,
1729
+ "single_word": false,
1730
+ "special": true
1731
+ },
1732
+ "216": {
1733
+ "content": "[extra_id_54]",
1734
+ "lstrip": false,
1735
+ "normalized": false,
1736
+ "rstrip": false,
1737
+ "single_word": false,
1738
+ "special": true
1739
+ },
1740
+ "217": {
1741
+ "content": "[extra_id_55]",
1742
+ "lstrip": false,
1743
+ "normalized": false,
1744
+ "rstrip": false,
1745
+ "single_word": false,
1746
+ "special": true
1747
+ },
1748
+ "218": {
1749
+ "content": "[extra_id_56]",
1750
+ "lstrip": false,
1751
+ "normalized": false,
1752
+ "rstrip": false,
1753
+ "single_word": false,
1754
+ "special": true
1755
+ },
1756
+ "219": {
1757
+ "content": "[extra_id_57]",
1758
+ "lstrip": false,
1759
+ "normalized": false,
1760
+ "rstrip": false,
1761
+ "single_word": false,
1762
+ "special": true
1763
+ },
1764
+ "220": {
1765
+ "content": "[extra_id_58]",
1766
+ "lstrip": false,
1767
+ "normalized": false,
1768
+ "rstrip": false,
1769
+ "single_word": false,
1770
+ "special": true
1771
+ },
1772
+ "221": {
1773
+ "content": "[extra_id_59]",
1774
+ "lstrip": false,
1775
+ "normalized": false,
1776
+ "rstrip": false,
1777
+ "single_word": false,
1778
+ "special": true
1779
+ },
1780
+ "222": {
1781
+ "content": "[extra_id_60]",
1782
+ "lstrip": false,
1783
+ "normalized": false,
1784
+ "rstrip": false,
1785
+ "single_word": false,
1786
+ "special": true
1787
+ },
1788
+ "223": {
1789
+ "content": "[extra_id_61]",
1790
+ "lstrip": false,
1791
+ "normalized": false,
1792
+ "rstrip": false,
1793
+ "single_word": false,
1794
+ "special": true
1795
+ },
1796
+ "224": {
1797
+ "content": "[extra_id_62]",
1798
+ "lstrip": false,
1799
+ "normalized": false,
1800
+ "rstrip": false,
1801
+ "single_word": false,
1802
+ "special": true
1803
+ },
1804
+ "225": {
1805
+ "content": "[extra_id_63]",
1806
+ "lstrip": false,
1807
+ "normalized": false,
1808
+ "rstrip": false,
1809
+ "single_word": false,
1810
+ "special": true
1811
+ },
1812
+ "226": {
1813
+ "content": "[extra_id_64]",
1814
+ "lstrip": false,
1815
+ "normalized": false,
1816
+ "rstrip": false,
1817
+ "single_word": false,
1818
+ "special": true
1819
+ },
1820
+ "227": {
1821
+ "content": "[extra_id_65]",
1822
+ "lstrip": false,
1823
+ "normalized": false,
1824
+ "rstrip": false,
1825
+ "single_word": false,
1826
+ "special": true
1827
+ },
1828
+ "228": {
1829
+ "content": "[extra_id_66]",
1830
+ "lstrip": false,
1831
+ "normalized": false,
1832
+ "rstrip": false,
1833
+ "single_word": false,
1834
+ "special": true
1835
+ },
1836
+ "229": {
1837
+ "content": "[extra_id_67]",
1838
+ "lstrip": false,
1839
+ "normalized": false,
1840
+ "rstrip": false,
1841
+ "single_word": false,
1842
+ "special": true
1843
+ },
1844
+ "230": {
1845
+ "content": "[extra_id_68]",
1846
+ "lstrip": false,
1847
+ "normalized": false,
1848
+ "rstrip": false,
1849
+ "single_word": false,
1850
+ "special": true
1851
+ },
1852
+ "231": {
1853
+ "content": "[extra_id_69]",
1854
+ "lstrip": false,
1855
+ "normalized": false,
1856
+ "rstrip": false,
1857
+ "single_word": false,
1858
+ "special": true
1859
+ },
1860
+ "232": {
1861
+ "content": "[extra_id_70]",
1862
+ "lstrip": false,
1863
+ "normalized": false,
1864
+ "rstrip": false,
1865
+ "single_word": false,
1866
+ "special": true
1867
+ },
1868
+ "233": {
1869
+ "content": "[extra_id_71]",
1870
+ "lstrip": false,
1871
+ "normalized": false,
1872
+ "rstrip": false,
1873
+ "single_word": false,
1874
+ "special": true
1875
+ },
1876
+ "234": {
1877
+ "content": "[extra_id_72]",
1878
+ "lstrip": false,
1879
+ "normalized": false,
1880
+ "rstrip": false,
1881
+ "single_word": false,
1882
+ "special": true
1883
+ },
1884
+ "235": {
1885
+ "content": "[extra_id_73]",
1886
+ "lstrip": false,
1887
+ "normalized": false,
1888
+ "rstrip": false,
1889
+ "single_word": false,
1890
+ "special": true
1891
+ },
1892
+ "236": {
1893
+ "content": "[extra_id_74]",
1894
+ "lstrip": false,
1895
+ "normalized": false,
1896
+ "rstrip": false,
1897
+ "single_word": false,
1898
+ "special": true
1899
+ },
1900
+ "237": {
1901
+ "content": "[extra_id_75]",
1902
+ "lstrip": false,
1903
+ "normalized": false,
1904
+ "rstrip": false,
1905
+ "single_word": false,
1906
+ "special": true
1907
+ },
1908
+ "238": {
1909
+ "content": "[extra_id_76]",
1910
+ "lstrip": false,
1911
+ "normalized": false,
1912
+ "rstrip": false,
1913
+ "single_word": false,
1914
+ "special": true
1915
+ },
1916
+ "239": {
1917
+ "content": "[extra_id_77]",
1918
+ "lstrip": false,
1919
+ "normalized": false,
1920
+ "rstrip": false,
1921
+ "single_word": false,
1922
+ "special": true
1923
+ },
1924
+ "240": {
1925
+ "content": "[extra_id_78]",
1926
+ "lstrip": false,
1927
+ "normalized": false,
1928
+ "rstrip": false,
1929
+ "single_word": false,
1930
+ "special": true
1931
+ },
1932
+ "241": {
1933
+ "content": "[extra_id_79]",
1934
+ "lstrip": false,
1935
+ "normalized": false,
1936
+ "rstrip": false,
1937
+ "single_word": false,
1938
+ "special": true
1939
+ },
1940
+ "242": {
1941
+ "content": "[extra_id_80]",
1942
+ "lstrip": false,
1943
+ "normalized": false,
1944
+ "rstrip": false,
1945
+ "single_word": false,
1946
+ "special": true
1947
+ },
1948
+ "243": {
1949
+ "content": "[extra_id_81]",
1950
+ "lstrip": false,
1951
+ "normalized": false,
1952
+ "rstrip": false,
1953
+ "single_word": false,
1954
+ "special": true
1955
+ },
1956
+ "244": {
1957
+ "content": "[extra_id_82]",
1958
+ "lstrip": false,
1959
+ "normalized": false,
1960
+ "rstrip": false,
1961
+ "single_word": false,
1962
+ "special": true
1963
+ },
1964
+ "245": {
1965
+ "content": "[extra_id_83]",
1966
+ "lstrip": false,
1967
+ "normalized": false,
1968
+ "rstrip": false,
1969
+ "single_word": false,
1970
+ "special": true
1971
+ },
1972
+ "246": {
1973
+ "content": "[extra_id_84]",
1974
+ "lstrip": false,
1975
+ "normalized": false,
1976
+ "rstrip": false,
1977
+ "single_word": false,
1978
+ "special": true
1979
+ },
1980
+ "247": {
1981
+ "content": "[extra_id_85]",
1982
+ "lstrip": false,
1983
+ "normalized": false,
1984
+ "rstrip": false,
1985
+ "single_word": false,
1986
+ "special": true
1987
+ },
1988
+ "248": {
1989
+ "content": "[extra_id_86]",
1990
+ "lstrip": false,
1991
+ "normalized": false,
1992
+ "rstrip": false,
1993
+ "single_word": false,
1994
+ "special": true
1995
+ },
1996
+ "249": {
1997
+ "content": "[extra_id_87]",
1998
+ "lstrip": false,
1999
+ "normalized": false,
2000
+ "rstrip": false,
2001
+ "single_word": false,
2002
+ "special": true
2003
+ },
2004
+ "250": {
2005
+ "content": "[extra_id_88]",
2006
+ "lstrip": false,
2007
+ "normalized": false,
2008
+ "rstrip": false,
2009
+ "single_word": false,
2010
+ "special": true
2011
+ },
2012
+ "251": {
2013
+ "content": "[extra_id_89]",
2014
+ "lstrip": false,
2015
+ "normalized": false,
2016
+ "rstrip": false,
2017
+ "single_word": false,
2018
+ "special": true
2019
+ },
2020
+ "252": {
2021
+ "content": "[extra_id_90]",
2022
+ "lstrip": false,
2023
+ "normalized": false,
2024
+ "rstrip": false,
2025
+ "single_word": false,
2026
+ "special": true
2027
+ },
2028
+ "253": {
2029
+ "content": "[extra_id_91]",
2030
+ "lstrip": false,
2031
+ "normalized": false,
2032
+ "rstrip": false,
2033
+ "single_word": false,
2034
+ "special": true
2035
+ },
2036
+ "254": {
2037
+ "content": "[extra_id_92]",
2038
+ "lstrip": false,
2039
+ "normalized": false,
2040
+ "rstrip": false,
2041
+ "single_word": false,
2042
+ "special": true
2043
+ },
2044
+ "255": {
2045
+ "content": "[extra_id_93]",
2046
+ "lstrip": false,
2047
+ "normalized": false,
2048
+ "rstrip": false,
2049
+ "single_word": false,
2050
+ "special": true
2051
+ },
2052
+ "256": {
2053
+ "content": "[extra_id_94]",
2054
+ "lstrip": false,
2055
+ "normalized": false,
2056
+ "rstrip": false,
2057
+ "single_word": false,
2058
+ "special": true
2059
+ },
2060
+ "257": {
2061
+ "content": "[extra_id_95]",
2062
+ "lstrip": false,
2063
+ "normalized": false,
2064
+ "rstrip": false,
2065
+ "single_word": false,
2066
+ "special": true
2067
+ },
2068
+ "258": {
2069
+ "content": "[extra_id_96]",
2070
+ "lstrip": false,
2071
+ "normalized": false,
2072
+ "rstrip": false,
2073
+ "single_word": false,
2074
+ "special": true
2075
+ },
2076
+ "259": {
2077
+ "content": "[extra_id_97]",
2078
+ "lstrip": false,
2079
+ "normalized": false,
2080
+ "rstrip": false,
2081
+ "single_word": false,
2082
+ "special": true
2083
+ },
2084
+ "260": {
2085
+ "content": "[extra_id_98]",
2086
+ "lstrip": false,
2087
+ "normalized": false,
2088
+ "rstrip": false,
2089
+ "single_word": false,
2090
+ "special": true
2091
+ },
2092
+ "261": {
2093
+ "content": "[extra_id_99]",
2094
+ "lstrip": false,
2095
+ "normalized": false,
2096
+ "rstrip": false,
2097
+ "single_word": false,
2098
+ "special": true
2099
+ },
2100
+ "262": {
2101
+ "content": "[extra_id_100]",
2102
+ "lstrip": false,
2103
+ "normalized": false,
2104
+ "rstrip": false,
2105
+ "single_word": false,
2106
+ "special": true
2107
+ },
2108
+ "263": {
2109
+ "content": "[extra_id_101]",
2110
+ "lstrip": false,
2111
+ "normalized": false,
2112
+ "rstrip": false,
2113
+ "single_word": false,
2114
+ "special": true
2115
+ },
2116
+ "264": {
2117
+ "content": "[extra_id_102]",
2118
+ "lstrip": false,
2119
+ "normalized": false,
2120
+ "rstrip": false,
2121
+ "single_word": false,
2122
+ "special": true
2123
+ },
2124
+ "265": {
2125
+ "content": "[extra_id_103]",
2126
+ "lstrip": false,
2127
+ "normalized": false,
2128
+ "rstrip": false,
2129
+ "single_word": false,
2130
+ "special": true
2131
+ },
2132
+ "266": {
2133
+ "content": "[extra_id_104]",
2134
+ "lstrip": false,
2135
+ "normalized": false,
2136
+ "rstrip": false,
2137
+ "single_word": false,
2138
+ "special": true
2139
+ },
2140
+ "267": {
2141
+ "content": "[extra_id_105]",
2142
+ "lstrip": false,
2143
+ "normalized": false,
2144
+ "rstrip": false,
2145
+ "single_word": false,
2146
+ "special": true
2147
+ },
2148
+ "268": {
2149
+ "content": "[extra_id_106]",
2150
+ "lstrip": false,
2151
+ "normalized": false,
2152
+ "rstrip": false,
2153
+ "single_word": false,
2154
+ "special": true
2155
+ },
2156
+ "269": {
2157
+ "content": "[extra_id_107]",
2158
+ "lstrip": false,
2159
+ "normalized": false,
2160
+ "rstrip": false,
2161
+ "single_word": false,
2162
+ "special": true
2163
+ },
2164
+ "270": {
2165
+ "content": "[extra_id_108]",
2166
+ "lstrip": false,
2167
+ "normalized": false,
2168
+ "rstrip": false,
2169
+ "single_word": false,
2170
+ "special": true
2171
+ },
2172
+ "271": {
2173
+ "content": "[extra_id_109]",
2174
+ "lstrip": false,
2175
+ "normalized": false,
2176
+ "rstrip": false,
2177
+ "single_word": false,
2178
+ "special": true
2179
+ },
2180
+ "272": {
2181
+ "content": "[extra_id_110]",
2182
+ "lstrip": false,
2183
+ "normalized": false,
2184
+ "rstrip": false,
2185
+ "single_word": false,
2186
+ "special": true
2187
+ },
2188
+ "273": {
2189
+ "content": "[extra_id_111]",
2190
+ "lstrip": false,
2191
+ "normalized": false,
2192
+ "rstrip": false,
2193
+ "single_word": false,
2194
+ "special": true
2195
+ },
2196
+ "274": {
2197
+ "content": "[extra_id_112]",
2198
+ "lstrip": false,
2199
+ "normalized": false,
2200
+ "rstrip": false,
2201
+ "single_word": false,
2202
+ "special": true
2203
+ },
2204
+ "275": {
2205
+ "content": "[extra_id_113]",
2206
+ "lstrip": false,
2207
+ "normalized": false,
2208
+ "rstrip": false,
2209
+ "single_word": false,
2210
+ "special": true
2211
+ },
2212
+ "276": {
2213
+ "content": "[extra_id_114]",
2214
+ "lstrip": false,
2215
+ "normalized": false,
2216
+ "rstrip": false,
2217
+ "single_word": false,
2218
+ "special": true
2219
+ },
2220
+ "277": {
2221
+ "content": "[extra_id_115]",
2222
+ "lstrip": false,
2223
+ "normalized": false,
2224
+ "rstrip": false,
2225
+ "single_word": false,
2226
+ "special": true
2227
+ },
2228
+ "278": {
2229
+ "content": "[extra_id_116]",
2230
+ "lstrip": false,
2231
+ "normalized": false,
2232
+ "rstrip": false,
2233
+ "single_word": false,
2234
+ "special": true
2235
+ },
2236
+ "279": {
2237
+ "content": "[extra_id_117]",
2238
+ "lstrip": false,
2239
+ "normalized": false,
2240
+ "rstrip": false,
2241
+ "single_word": false,
2242
+ "special": true
2243
+ },
2244
+ "280": {
2245
+ "content": "[extra_id_118]",
2246
+ "lstrip": false,
2247
+ "normalized": false,
2248
+ "rstrip": false,
2249
+ "single_word": false,
2250
+ "special": true
2251
+ },
2252
+ "281": {
2253
+ "content": "[extra_id_119]",
2254
+ "lstrip": false,
2255
+ "normalized": false,
2256
+ "rstrip": false,
2257
+ "single_word": false,
2258
+ "special": true
2259
+ },
2260
+ "282": {
2261
+ "content": "[extra_id_120]",
2262
+ "lstrip": false,
2263
+ "normalized": false,
2264
+ "rstrip": false,
2265
+ "single_word": false,
2266
+ "special": true
2267
+ },
2268
+ "283": {
2269
+ "content": "[extra_id_121]",
2270
+ "lstrip": false,
2271
+ "normalized": false,
2272
+ "rstrip": false,
2273
+ "single_word": false,
2274
+ "special": true
2275
+ },
2276
+ "284": {
2277
+ "content": "[extra_id_122]",
2278
+ "lstrip": false,
2279
+ "normalized": false,
2280
+ "rstrip": false,
2281
+ "single_word": false,
2282
+ "special": true
2283
+ },
2284
+ "285": {
2285
+ "content": "[extra_id_123]",
2286
+ "lstrip": false,
2287
+ "normalized": false,
2288
+ "rstrip": false,
2289
+ "single_word": false,
2290
+ "special": true
2291
+ },
2292
+ "286": {
2293
+ "content": "[extra_id_124]",
2294
+ "lstrip": false,
2295
+ "normalized": false,
2296
+ "rstrip": false,
2297
+ "single_word": false,
2298
+ "special": true
2299
+ },
2300
+ "287": {
2301
+ "content": "[extra_id_125]",
2302
+ "lstrip": false,
2303
+ "normalized": false,
2304
+ "rstrip": false,
2305
+ "single_word": false,
2306
+ "special": true
2307
+ },
2308
+ "288": {
2309
+ "content": "[extra_id_126]",
2310
+ "lstrip": false,
2311
+ "normalized": false,
2312
+ "rstrip": false,
2313
+ "single_word": false,
2314
+ "special": true
2315
+ },
2316
+ "289": {
2317
+ "content": "[extra_id_127]",
2318
+ "lstrip": false,
2319
+ "normalized": false,
2320
+ "rstrip": false,
2321
+ "single_word": false,
2322
+ "special": true
2323
+ },
2324
+ "290": {
2325
+ "content": "[extra_id_128]",
2326
+ "lstrip": false,
2327
+ "normalized": false,
2328
+ "rstrip": false,
2329
+ "single_word": false,
2330
+ "special": true
2331
+ },
2332
+ "291": {
2333
+ "content": "[extra_id_129]",
2334
+ "lstrip": false,
2335
+ "normalized": false,
2336
+ "rstrip": false,
2337
+ "single_word": false,
2338
+ "special": true
2339
+ },
2340
+ "292": {
2341
+ "content": "[extra_id_130]",
2342
+ "lstrip": false,
2343
+ "normalized": false,
2344
+ "rstrip": false,
2345
+ "single_word": false,
2346
+ "special": true
2347
+ },
2348
+ "293": {
2349
+ "content": "[extra_id_131]",
2350
+ "lstrip": false,
2351
+ "normalized": false,
2352
+ "rstrip": false,
2353
+ "single_word": false,
2354
+ "special": true
2355
+ },
2356
+ "294": {
2357
+ "content": "[extra_id_132]",
2358
+ "lstrip": false,
2359
+ "normalized": false,
2360
+ "rstrip": false,
2361
+ "single_word": false,
2362
+ "special": true
2363
+ },
2364
+ "295": {
2365
+ "content": "[extra_id_133]",
2366
+ "lstrip": false,
2367
+ "normalized": false,
2368
+ "rstrip": false,
2369
+ "single_word": false,
2370
+ "special": true
2371
+ },
2372
+ "296": {
2373
+ "content": "[extra_id_134]",
2374
+ "lstrip": false,
2375
+ "normalized": false,
2376
+ "rstrip": false,
2377
+ "single_word": false,
2378
+ "special": true
2379
+ },
2380
+ "297": {
2381
+ "content": "[extra_id_135]",
2382
+ "lstrip": false,
2383
+ "normalized": false,
2384
+ "rstrip": false,
2385
+ "single_word": false,
2386
+ "special": true
2387
+ },
2388
+ "298": {
2389
+ "content": "[extra_id_136]",
2390
+ "lstrip": false,
2391
+ "normalized": false,
2392
+ "rstrip": false,
2393
+ "single_word": false,
2394
+ "special": true
2395
+ },
2396
+ "299": {
2397
+ "content": "[extra_id_137]",
2398
+ "lstrip": false,
2399
+ "normalized": false,
2400
+ "rstrip": false,
2401
+ "single_word": false,
2402
+ "special": true
2403
+ },
2404
+ "300": {
2405
+ "content": "[extra_id_138]",
2406
+ "lstrip": false,
2407
+ "normalized": false,
2408
+ "rstrip": false,
2409
+ "single_word": false,
2410
+ "special": true
2411
+ },
2412
+ "301": {
2413
+ "content": "[extra_id_139]",
2414
+ "lstrip": false,
2415
+ "normalized": false,
2416
+ "rstrip": false,
2417
+ "single_word": false,
2418
+ "special": true
2419
+ },
2420
+ "302": {
2421
+ "content": "[extra_id_140]",
2422
+ "lstrip": false,
2423
+ "normalized": false,
2424
+ "rstrip": false,
2425
+ "single_word": false,
2426
+ "special": true
2427
+ },
2428
+ "303": {
2429
+ "content": "[extra_id_141]",
2430
+ "lstrip": false,
2431
+ "normalized": false,
2432
+ "rstrip": false,
2433
+ "single_word": false,
2434
+ "special": true
2435
+ },
2436
+ "304": {
2437
+ "content": "[extra_id_142]",
2438
+ "lstrip": false,
2439
+ "normalized": false,
2440
+ "rstrip": false,
2441
+ "single_word": false,
2442
+ "special": true
2443
+ },
2444
+ "305": {
2445
+ "content": "[extra_id_143]",
2446
+ "lstrip": false,
2447
+ "normalized": false,
2448
+ "rstrip": false,
2449
+ "single_word": false,
2450
+ "special": true
2451
+ },
2452
+ "306": {
2453
+ "content": "[extra_id_144]",
2454
+ "lstrip": false,
2455
+ "normalized": false,
2456
+ "rstrip": false,
2457
+ "single_word": false,
2458
+ "special": true
2459
+ },
2460
+ "307": {
2461
+ "content": "[extra_id_145]",
2462
+ "lstrip": false,
2463
+ "normalized": false,
2464
+ "rstrip": false,
2465
+ "single_word": false,
2466
+ "special": true
2467
+ },
2468
+ "308": {
2469
+ "content": "[extra_id_146]",
2470
+ "lstrip": false,
2471
+ "normalized": false,
2472
+ "rstrip": false,
2473
+ "single_word": false,
2474
+ "special": true
2475
+ },
2476
+ "309": {
2477
+ "content": "[extra_id_147]",
2478
+ "lstrip": false,
2479
+ "normalized": false,
2480
+ "rstrip": false,
2481
+ "single_word": false,
2482
+ "special": true
2483
+ },
2484
+ "310": {
2485
+ "content": "[extra_id_148]",
2486
+ "lstrip": false,
2487
+ "normalized": false,
2488
+ "rstrip": false,
2489
+ "single_word": false,
2490
+ "special": true
2491
+ },
2492
+ "311": {
2493
+ "content": "[extra_id_149]",
2494
+ "lstrip": false,
2495
+ "normalized": false,
2496
+ "rstrip": false,
2497
+ "single_word": false,
2498
+ "special": true
2499
+ },
2500
+ "312": {
2501
+ "content": "[extra_id_150]",
2502
+ "lstrip": false,
2503
+ "normalized": false,
2504
+ "rstrip": false,
2505
+ "single_word": false,
2506
+ "special": true
2507
+ },
2508
+ "313": {
2509
+ "content": "[extra_id_151]",
2510
+ "lstrip": false,
2511
+ "normalized": false,
2512
+ "rstrip": false,
2513
+ "single_word": false,
2514
+ "special": true
2515
+ },
2516
+ "314": {
2517
+ "content": "[extra_id_152]",
2518
+ "lstrip": false,
2519
+ "normalized": false,
2520
+ "rstrip": false,
2521
+ "single_word": false,
2522
+ "special": true
2523
+ },
2524
+ "315": {
2525
+ "content": "[extra_id_153]",
2526
+ "lstrip": false,
2527
+ "normalized": false,
2528
+ "rstrip": false,
2529
+ "single_word": false,
2530
+ "special": true
2531
+ },
2532
+ "316": {
2533
+ "content": "[extra_id_154]",
2534
+ "lstrip": false,
2535
+ "normalized": false,
2536
+ "rstrip": false,
2537
+ "single_word": false,
2538
+ "special": true
2539
+ },
2540
+ "317": {
2541
+ "content": "[extra_id_155]",
2542
+ "lstrip": false,
2543
+ "normalized": false,
2544
+ "rstrip": false,
2545
+ "single_word": false,
2546
+ "special": true
2547
+ },
2548
+ "318": {
2549
+ "content": "[extra_id_156]",
2550
+ "lstrip": false,
2551
+ "normalized": false,
2552
+ "rstrip": false,
2553
+ "single_word": false,
2554
+ "special": true
2555
+ },
2556
+ "319": {
2557
+ "content": "[extra_id_157]",
2558
+ "lstrip": false,
2559
+ "normalized": false,
2560
+ "rstrip": false,
2561
+ "single_word": false,
2562
+ "special": true
2563
+ },
2564
+ "320": {
2565
+ "content": "[extra_id_158]",
2566
+ "lstrip": false,
2567
+ "normalized": false,
2568
+ "rstrip": false,
2569
+ "single_word": false,
2570
+ "special": true
2571
+ },
2572
+ "321": {
2573
+ "content": "[extra_id_159]",
2574
+ "lstrip": false,
2575
+ "normalized": false,
2576
+ "rstrip": false,
2577
+ "single_word": false,
2578
+ "special": true
2579
+ },
2580
+ "322": {
2581
+ "content": "[extra_id_160]",
2582
+ "lstrip": false,
2583
+ "normalized": false,
2584
+ "rstrip": false,
2585
+ "single_word": false,
2586
+ "special": true
2587
+ },
2588
+ "323": {
2589
+ "content": "[extra_id_161]",
2590
+ "lstrip": false,
2591
+ "normalized": false,
2592
+ "rstrip": false,
2593
+ "single_word": false,
2594
+ "special": true
2595
+ },
2596
+ "324": {
2597
+ "content": "[extra_id_162]",
2598
+ "lstrip": false,
2599
+ "normalized": false,
2600
+ "rstrip": false,
2601
+ "single_word": false,
2602
+ "special": true
2603
+ },
2604
+ "325": {
2605
+ "content": "[extra_id_163]",
2606
+ "lstrip": false,
2607
+ "normalized": false,
2608
+ "rstrip": false,
2609
+ "single_word": false,
2610
+ "special": true
2611
+ },
2612
+ "326": {
2613
+ "content": "[extra_id_164]",
2614
+ "lstrip": false,
2615
+ "normalized": false,
2616
+ "rstrip": false,
2617
+ "single_word": false,
2618
+ "special": true
2619
+ },
2620
+ "327": {
2621
+ "content": "[extra_id_165]",
2622
+ "lstrip": false,
2623
+ "normalized": false,
2624
+ "rstrip": false,
2625
+ "single_word": false,
2626
+ "special": true
2627
+ },
2628
+ "328": {
2629
+ "content": "[extra_id_166]",
2630
+ "lstrip": false,
2631
+ "normalized": false,
2632
+ "rstrip": false,
2633
+ "single_word": false,
2634
+ "special": true
2635
+ },
2636
+ "329": {
2637
+ "content": "[extra_id_167]",
2638
+ "lstrip": false,
2639
+ "normalized": false,
2640
+ "rstrip": false,
2641
+ "single_word": false,
2642
+ "special": true
2643
+ },
2644
+ "330": {
2645
+ "content": "[extra_id_168]",
2646
+ "lstrip": false,
2647
+ "normalized": false,
2648
+ "rstrip": false,
2649
+ "single_word": false,
2650
+ "special": true
2651
+ },
2652
+ "331": {
2653
+ "content": "[extra_id_169]",
2654
+ "lstrip": false,
2655
+ "normalized": false,
2656
+ "rstrip": false,
2657
+ "single_word": false,
2658
+ "special": true
2659
+ },
2660
+ "332": {
2661
+ "content": "[extra_id_170]",
2662
+ "lstrip": false,
2663
+ "normalized": false,
2664
+ "rstrip": false,
2665
+ "single_word": false,
2666
+ "special": true
2667
+ },
2668
+ "333": {
2669
+ "content": "[extra_id_171]",
2670
+ "lstrip": false,
2671
+ "normalized": false,
2672
+ "rstrip": false,
2673
+ "single_word": false,
2674
+ "special": true
2675
+ },
2676
+ "334": {
2677
+ "content": "[extra_id_172]",
2678
+ "lstrip": false,
2679
+ "normalized": false,
2680
+ "rstrip": false,
2681
+ "single_word": false,
2682
+ "special": true
2683
+ },
2684
+ "335": {
2685
+ "content": "[extra_id_173]",
2686
+ "lstrip": false,
2687
+ "normalized": false,
2688
+ "rstrip": false,
2689
+ "single_word": false,
2690
+ "special": true
2691
+ },
2692
+ "336": {
2693
+ "content": "[extra_id_174]",
2694
+ "lstrip": false,
2695
+ "normalized": false,
2696
+ "rstrip": false,
2697
+ "single_word": false,
2698
+ "special": true
2699
+ },
2700
+ "337": {
2701
+ "content": "[extra_id_175]",
2702
+ "lstrip": false,
2703
+ "normalized": false,
2704
+ "rstrip": false,
2705
+ "single_word": false,
2706
+ "special": true
2707
+ },
2708
+ "338": {
2709
+ "content": "[extra_id_176]",
2710
+ "lstrip": false,
2711
+ "normalized": false,
2712
+ "rstrip": false,
2713
+ "single_word": false,
2714
+ "special": true
2715
+ },
2716
+ "339": {
2717
+ "content": "[extra_id_177]",
2718
+ "lstrip": false,
2719
+ "normalized": false,
2720
+ "rstrip": false,
2721
+ "single_word": false,
2722
+ "special": true
2723
+ },
2724
+ "340": {
2725
+ "content": "[extra_id_178]",
2726
+ "lstrip": false,
2727
+ "normalized": false,
2728
+ "rstrip": false,
2729
+ "single_word": false,
2730
+ "special": true
2731
+ },
2732
+ "341": {
2733
+ "content": "[extra_id_179]",
2734
+ "lstrip": false,
2735
+ "normalized": false,
2736
+ "rstrip": false,
2737
+ "single_word": false,
2738
+ "special": true
2739
+ },
2740
+ "342": {
2741
+ "content": "[extra_id_180]",
2742
+ "lstrip": false,
2743
+ "normalized": false,
2744
+ "rstrip": false,
2745
+ "single_word": false,
2746
+ "special": true
2747
+ },
2748
+ "343": {
2749
+ "content": "[extra_id_181]",
2750
+ "lstrip": false,
2751
+ "normalized": false,
2752
+ "rstrip": false,
2753
+ "single_word": false,
2754
+ "special": true
2755
+ },
2756
+ "344": {
2757
+ "content": "[extra_id_182]",
2758
+ "lstrip": false,
2759
+ "normalized": false,
2760
+ "rstrip": false,
2761
+ "single_word": false,
2762
+ "special": true
2763
+ },
2764
+ "345": {
2765
+ "content": "[extra_id_183]",
2766
+ "lstrip": false,
2767
+ "normalized": false,
2768
+ "rstrip": false,
2769
+ "single_word": false,
2770
+ "special": true
2771
+ },
2772
+ "346": {
2773
+ "content": "[extra_id_184]",
2774
+ "lstrip": false,
2775
+ "normalized": false,
2776
+ "rstrip": false,
2777
+ "single_word": false,
2778
+ "special": true
2779
+ },
2780
+ "347": {
2781
+ "content": "[extra_id_185]",
2782
+ "lstrip": false,
2783
+ "normalized": false,
2784
+ "rstrip": false,
2785
+ "single_word": false,
2786
+ "special": true
2787
+ },
2788
+ "348": {
2789
+ "content": "[extra_id_186]",
2790
+ "lstrip": false,
2791
+ "normalized": false,
2792
+ "rstrip": false,
2793
+ "single_word": false,
2794
+ "special": true
2795
+ },
2796
+ "349": {
2797
+ "content": "[extra_id_187]",
2798
+ "lstrip": false,
2799
+ "normalized": false,
2800
+ "rstrip": false,
2801
+ "single_word": false,
2802
+ "special": true
2803
+ },
2804
+ "350": {
2805
+ "content": "[extra_id_188]",
2806
+ "lstrip": false,
2807
+ "normalized": false,
2808
+ "rstrip": false,
2809
+ "single_word": false,
2810
+ "special": true
2811
+ },
2812
+ "351": {
2813
+ "content": "[extra_id_189]",
2814
+ "lstrip": false,
2815
+ "normalized": false,
2816
+ "rstrip": false,
2817
+ "single_word": false,
2818
+ "special": true
2819
+ },
2820
+ "352": {
2821
+ "content": "[extra_id_190]",
2822
+ "lstrip": false,
2823
+ "normalized": false,
2824
+ "rstrip": false,
2825
+ "single_word": false,
2826
+ "special": true
2827
+ },
2828
+ "353": {
2829
+ "content": "[extra_id_191]",
2830
+ "lstrip": false,
2831
+ "normalized": false,
2832
+ "rstrip": false,
2833
+ "single_word": false,
2834
+ "special": true
2835
+ },
2836
+ "354": {
2837
+ "content": "[extra_id_192]",
2838
+ "lstrip": false,
2839
+ "normalized": false,
2840
+ "rstrip": false,
2841
+ "single_word": false,
2842
+ "special": true
2843
+ },
2844
+ "355": {
2845
+ "content": "[extra_id_193]",
2846
+ "lstrip": false,
2847
+ "normalized": false,
2848
+ "rstrip": false,
2849
+ "single_word": false,
2850
+ "special": true
2851
+ },
2852
+ "356": {
2853
+ "content": "[extra_id_194]",
2854
+ "lstrip": false,
2855
+ "normalized": false,
2856
+ "rstrip": false,
2857
+ "single_word": false,
2858
+ "special": true
2859
+ },
2860
+ "357": {
2861
+ "content": "[extra_id_195]",
2862
+ "lstrip": false,
2863
+ "normalized": false,
2864
+ "rstrip": false,
2865
+ "single_word": false,
2866
+ "special": true
2867
+ },
2868
+ "358": {
2869
+ "content": "[extra_id_196]",
2870
+ "lstrip": false,
2871
+ "normalized": false,
2872
+ "rstrip": false,
2873
+ "single_word": false,
2874
+ "special": true
2875
+ },
2876
+ "359": {
2877
+ "content": "[extra_id_197]",
2878
+ "lstrip": false,
2879
+ "normalized": false,
2880
+ "rstrip": false,
2881
+ "single_word": false,
2882
+ "special": true
2883
+ },
2884
+ "360": {
2885
+ "content": "[extra_id_198]",
2886
+ "lstrip": false,
2887
+ "normalized": false,
2888
+ "rstrip": false,
2889
+ "single_word": false,
2890
+ "special": true
2891
+ },
2892
+ "361": {
2893
+ "content": "[|endofturn|]",
2894
+ "lstrip": false,
2895
+ "normalized": false,
2896
+ "rstrip": false,
2897
+ "single_word": false,
2898
+ "special": true
2899
+ }
2900
+ },
2901
+ "additional_special_token": [
2902
+ "[unused0]",
2903
+ "[unused1]",
2904
+ "[unused2]",
2905
+ "[unused3]",
2906
+ "[unused4]",
2907
+ "[unused5]",
2908
+ "[unused6]",
2909
+ "[unused7]",
2910
+ "[unused8]",
2911
+ "[unused9]",
2912
+ "[unused10]",
2913
+ "[unused11]",
2914
+ "[unused12]",
2915
+ "[unused13]",
2916
+ "[unused14]",
2917
+ "[unused15]",
2918
+ "[unused16]",
2919
+ "[unused17]",
2920
+ "[unused18]",
2921
+ "[unused19]",
2922
+ "[unused20]",
2923
+ "[unused21]",
2924
+ "[unused22]",
2925
+ "[unused23]",
2926
+ "[unused24]",
2927
+ "[unused25]",
2928
+ "[unused26]",
2929
+ "[unused27]",
2930
+ "[unused28]",
2931
+ "[unused29]",
2932
+ "[unused30]",
2933
+ "[unused31]",
2934
+ "[unused32]",
2935
+ "[unused33]",
2936
+ "[unused34]",
2937
+ "[unused35]",
2938
+ "[unused36]",
2939
+ "[unused37]",
2940
+ "[unused38]",
2941
+ "[unused39]",
2942
+ "[unused40]",
2943
+ "[unused41]",
2944
+ "[unused42]",
2945
+ "[unused43]",
2946
+ "[unused44]",
2947
+ "[unused45]",
2948
+ "[unused46]",
2949
+ "[unused47]",
2950
+ "[unused48]",
2951
+ "[unused49]",
2952
+ "[unused50]",
2953
+ "[unused51]",
2954
+ "[unused52]",
2955
+ "[unused53]",
2956
+ "[unused54]",
2957
+ "[unused55]",
2958
+ "[unused56]",
2959
+ "[unused57]",
2960
+ "[unused58]",
2961
+ "[unused59]",
2962
+ "[unused60]",
2963
+ "[unused61]",
2964
+ "[unused62]",
2965
+ "[unused63]",
2966
+ "[unused64]",
2967
+ "[unused65]",
2968
+ "[unused66]",
2969
+ "[unused67]",
2970
+ "[unused68]",
2971
+ "[unused69]",
2972
+ "[unused70]",
2973
+ "[unused71]",
2974
+ "[unused72]",
2975
+ "[unused73]",
2976
+ "[unused74]",
2977
+ "[unused75]",
2978
+ "[unused76]",
2979
+ "[unused77]",
2980
+ "[unused78]",
2981
+ "[unused79]",
2982
+ "[unused80]",
2983
+ "[unused81]",
2984
+ "[unused82]",
2985
+ "[unused83]",
2986
+ "[unused84]",
2987
+ "[unused85]",
2988
+ "[unused86]",
2989
+ "[unused87]",
2990
+ "[unused88]",
2991
+ "[unused89]",
2992
+ "[unused90]",
2993
+ "[unused91]",
2994
+ "[unused92]",
2995
+ "[unused93]",
2996
+ "[unused94]",
2997
+ "[unused95]",
2998
+ "[unused96]",
2999
+ "[unused97]",
3000
+ "[unused98]",
3001
+ "[unused99]",
3002
+ "[extra_id_0]",
3003
+ "[extra_id_1]",
3004
+ "[extra_id_2]",
3005
+ "[extra_id_3]",
3006
+ "[extra_id_4]",
3007
+ "[extra_id_5]",
3008
+ "[extra_id_6]",
3009
+ "[extra_id_7]",
3010
+ "[extra_id_8]",
3011
+ "[extra_id_9]",
3012
+ "[extra_id_10]",
3013
+ "[extra_id_11]",
3014
+ "[extra_id_12]",
3015
+ "[extra_id_13]",
3016
+ "[extra_id_14]",
3017
+ "[extra_id_15]",
3018
+ "[extra_id_16]",
3019
+ "[extra_id_17]",
3020
+ "[extra_id_18]",
3021
+ "[extra_id_19]",
3022
+ "[extra_id_20]",
3023
+ "[extra_id_21]",
3024
+ "[extra_id_22]",
3025
+ "[extra_id_23]",
3026
+ "[extra_id_24]",
3027
+ "[extra_id_25]",
3028
+ "[extra_id_26]",
3029
+ "[extra_id_27]",
3030
+ "[extra_id_28]",
3031
+ "[extra_id_29]",
3032
+ "[extra_id_30]",
3033
+ "[extra_id_31]",
3034
+ "[extra_id_32]",
3035
+ "[extra_id_33]",
3036
+ "[extra_id_34]",
3037
+ "[extra_id_35]",
3038
+ "[extra_id_36]",
3039
+ "[extra_id_37]",
3040
+ "[extra_id_38]",
3041
+ "[extra_id_39]",
3042
+ "[extra_id_40]",
3043
+ "[extra_id_41]",
3044
+ "[extra_id_42]",
3045
+ "[extra_id_43]",
3046
+ "[extra_id_44]",
3047
+ "[extra_id_45]",
3048
+ "[extra_id_46]",
3049
+ "[extra_id_47]",
3050
+ "[extra_id_48]",
3051
+ "[extra_id_49]",
3052
+ "[extra_id_50]",
3053
+ "[extra_id_51]",
3054
+ "[extra_id_52]",
3055
+ "[extra_id_53]",
3056
+ "[extra_id_54]",
3057
+ "[extra_id_55]",
3058
+ "[extra_id_56]",
3059
+ "[extra_id_57]",
3060
+ "[extra_id_58]",
3061
+ "[extra_id_59]",
3062
+ "[extra_id_60]",
3063
+ "[extra_id_61]",
3064
+ "[extra_id_62]",
3065
+ "[extra_id_63]",
3066
+ "[extra_id_64]",
3067
+ "[extra_id_65]",
3068
+ "[extra_id_66]",
3069
+ "[extra_id_67]",
3070
+ "[extra_id_68]",
3071
+ "[extra_id_69]",
3072
+ "[extra_id_70]",
3073
+ "[extra_id_71]",
3074
+ "[extra_id_72]",
3075
+ "[extra_id_73]",
3076
+ "[extra_id_74]",
3077
+ "[extra_id_75]",
3078
+ "[extra_id_76]",
3079
+ "[extra_id_77]",
3080
+ "[extra_id_78]",
3081
+ "[extra_id_79]",
3082
+ "[extra_id_80]",
3083
+ "[extra_id_81]",
3084
+ "[extra_id_82]",
3085
+ "[extra_id_83]",
3086
+ "[extra_id_84]",
3087
+ "[extra_id_85]",
3088
+ "[extra_id_86]",
3089
+ "[extra_id_87]",
3090
+ "[extra_id_88]",
3091
+ "[extra_id_89]",
3092
+ "[extra_id_90]",
3093
+ "[extra_id_91]",
3094
+ "[extra_id_92]",
3095
+ "[extra_id_93]",
3096
+ "[extra_id_94]",
3097
+ "[extra_id_95]",
3098
+ "[extra_id_96]",
3099
+ "[extra_id_97]",
3100
+ "[extra_id_98]",
3101
+ "[extra_id_99]",
3102
+ "[extra_id_100]",
3103
+ "[extra_id_101]",
3104
+ "[extra_id_102]",
3105
+ "[extra_id_103]",
3106
+ "[extra_id_104]",
3107
+ "[extra_id_105]",
3108
+ "[extra_id_106]",
3109
+ "[extra_id_107]",
3110
+ "[extra_id_108]",
3111
+ "[extra_id_109]",
3112
+ "[extra_id_110]",
3113
+ "[extra_id_111]",
3114
+ "[extra_id_112]",
3115
+ "[extra_id_113]",
3116
+ "[extra_id_114]",
3117
+ "[extra_id_115]",
3118
+ "[extra_id_116]",
3119
+ "[extra_id_117]",
3120
+ "[extra_id_118]",
3121
+ "[extra_id_119]",
3122
+ "[extra_id_120]",
3123
+ "[extra_id_121]",
3124
+ "[extra_id_122]",
3125
+ "[extra_id_123]",
3126
+ "[extra_id_124]",
3127
+ "[extra_id_125]",
3128
+ "[extra_id_126]",
3129
+ "[extra_id_127]",
3130
+ "[extra_id_128]",
3131
+ "[extra_id_129]",
3132
+ "[extra_id_130]",
3133
+ "[extra_id_131]",
3134
+ "[extra_id_132]",
3135
+ "[extra_id_133]",
3136
+ "[extra_id_134]",
3137
+ "[extra_id_135]",
3138
+ "[extra_id_136]",
3139
+ "[extra_id_137]",
3140
+ "[extra_id_138]",
3141
+ "[extra_id_139]",
3142
+ "[extra_id_140]",
3143
+ "[extra_id_141]",
3144
+ "[extra_id_142]",
3145
+ "[extra_id_143]",
3146
+ "[extra_id_144]",
3147
+ "[extra_id_145]",
3148
+ "[extra_id_146]",
3149
+ "[extra_id_147]",
3150
+ "[extra_id_148]",
3151
+ "[extra_id_149]",
3152
+ "[extra_id_150]",
3153
+ "[extra_id_151]",
3154
+ "[extra_id_152]",
3155
+ "[extra_id_153]",
3156
+ "[extra_id_154]",
3157
+ "[extra_id_155]",
3158
+ "[extra_id_156]",
3159
+ "[extra_id_157]",
3160
+ "[extra_id_158]",
3161
+ "[extra_id_159]",
3162
+ "[extra_id_160]",
3163
+ "[extra_id_161]",
3164
+ "[extra_id_162]",
3165
+ "[extra_id_163]",
3166
+ "[extra_id_164]",
3167
+ "[extra_id_165]",
3168
+ "[extra_id_166]",
3169
+ "[extra_id_167]",
3170
+ "[extra_id_168]",
3171
+ "[extra_id_169]",
3172
+ "[extra_id_170]",
3173
+ "[extra_id_171]",
3174
+ "[extra_id_172]",
3175
+ "[extra_id_173]",
3176
+ "[extra_id_174]",
3177
+ "[extra_id_175]",
3178
+ "[extra_id_176]",
3179
+ "[extra_id_177]",
3180
+ "[extra_id_178]",
3181
+ "[extra_id_179]",
3182
+ "[extra_id_180]",
3183
+ "[extra_id_181]",
3184
+ "[extra_id_182]",
3185
+ "[extra_id_183]",
3186
+ "[extra_id_184]",
3187
+ "[extra_id_185]",
3188
+ "[extra_id_186]",
3189
+ "[extra_id_187]",
3190
+ "[extra_id_188]",
3191
+ "[extra_id_189]",
3192
+ "[extra_id_190]",
3193
+ "[extra_id_191]",
3194
+ "[extra_id_192]",
3195
+ "[extra_id_193]",
3196
+ "[extra_id_194]",
3197
+ "[extra_id_195]",
3198
+ "[extra_id_196]",
3199
+ "[extra_id_197]",
3200
+ "[extra_id_198]",
3201
+ "[|endofturn|]",
3202
+ "PI:URL",
3203
+ "PI:EMAIL",
3204
+ "PI:ACCOUNT_NUM",
3205
+ "PI:PHONE_NUM",
3206
+ "PI:BUSINESS_NUM",
3207
+ "PI:ANNON",
3208
+ "PI:KEY",
3209
+ "PI:ID",
3210
+ "PI:IP_ADDRESS",
3211
+ "PI:USER"
3212
+ ],
3213
+ "bos_token": "[BOS]",
3214
+ "chat_template": "{% for message in messages %}{% if loop.first and message['role'] != 'system' %}{{ '[|system|][|endofturn|]\n' }}{% endif %}{% set content = message['content'] %}{% if '</thought>' in content %}{% set content = content.split('</thought>')[-1].lstrip('\\n') %}{% endif %}{{ '[|' + message['role'] + '|]' + content }}{% if not message['role'] == 'user' %}{{ '[|endofturn|]' }}{% endif %}{% if not loop.last %}{{ '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '\n[|assistant|]<thought>\n' }}{% endif %}",
3215
+ "clean_up_tokenization_spaces": true,
3216
+ "eos_token": "[|endofturn|]",
3217
+ "extra_special_tokens": {},
3218
+ "model_max_length": 1000000000000000019884624838656,
3219
+ "pad_token": "[PAD]",
3220
+ "tokenizer_class": "GPT2Tokenizer",
3221
+ "unk_token": "[UNK]"
3222
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff