AdoCleanCode committed on
Commit
68e4ddb
·
verified ·
1 Parent(s): 3bb3a41

Auto-upload tokenizer after eval at step 500

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
chat_template.jinja ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {{- bos_token }}
2
+ {%- if custom_tools is defined %}
3
+ {%- set tools = custom_tools %}
4
+ {%- endif %}
5
+ {%- if not tools_in_user_message is defined %}
6
+ {%- set tools_in_user_message = true %}
7
+ {%- endif %}
8
+ {%- if not date_string is defined %}
9
+ {%- if strftime_now is defined %}
10
+ {%- set date_string = strftime_now("%d %b %Y") %}
11
+ {%- else %}
12
+ {%- set date_string = "26 Jul 2024" %}
13
+ {%- endif %}
14
+ {%- endif %}
15
+ {%- if not tools is defined %}
16
+ {%- set tools = none %}
17
+ {%- endif %}
18
+
19
+ {#- This block extracts the system message, so we can slot it into the right place. #}
20
+ {%- if messages[0]['role'] == 'system' %}
21
+ {%- set system_message = messages[0]['content']|trim %}
22
+ {%- set messages = messages[1:] %}
23
+ {%- else %}
24
+ {%- set system_message = "" %}
25
+ {%- endif %}
26
+
27
+ {#- System message #}
28
+ {{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
29
+ {%- if tools is not none %}
30
+ {{- "Environment: ipython\n" }}
31
+ {%- endif %}
32
+ {{- "Cutting Knowledge Date: December 2023\n" }}
33
+ {{- "Today Date: " + date_string + "\n\n" }}
34
+ {%- if tools is not none and not tools_in_user_message %}
35
+ {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
36
+ {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
37
+ {{- "Do not use variables.\n\n" }}
38
+ {%- for t in tools %}
39
+ {{- t | tojson(indent=4) }}
40
+ {{- "\n\n" }}
41
+ {%- endfor %}
42
+ {%- endif %}
43
+ {{- system_message }}
44
+ {{- "<|eot_id|>" }}
45
+
46
+ {#- Custom tools are passed in a user message with some extra guidance #}
47
+ {%- if tools_in_user_message and not tools is none %}
48
+ {#- Extract the first user message so we can plug it in here #}
49
+ {%- if messages | length != 0 %}
50
+ {%- set first_user_message = messages[0]['content']|trim %}
51
+ {%- set messages = messages[1:] %}
52
+ {%- else %}
53
+ {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
54
+ {%- endif %}
55
+ {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
56
+ {{- "Given the following functions, please respond with a JSON for a function call " }}
57
+ {{- "with its proper arguments that best answers the given prompt.\n\n" }}
58
+ {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
59
+ {{- "Do not use variables.\n\n" }}
60
+ {%- for t in tools %}
61
+ {{- t | tojson(indent=4) }}
62
+ {{- "\n\n" }}
63
+ {%- endfor %}
64
+ {{- first_user_message + "<|eot_id|>"}}
65
+ {%- endif %}
66
+
67
+ {%- for message in messages %}
68
+ {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
69
+ {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
70
+ {%- elif 'tool_calls' in message %}
71
+ {%- if not message.tool_calls|length == 1 %}
72
+ {{- raise_exception("This model only supports single tool-calls at once!") }}
73
+ {%- endif %}
74
+ {%- set tool_call = message.tool_calls[0].function %}
75
+ {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
76
+ {{- '{"name": "' + tool_call.name + '", ' }}
77
+ {{- '"parameters": ' }}
78
+ {{- tool_call.arguments | tojson }}
79
+ {{- "}" }}
80
+ {{- "<|eot_id|>" }}
81
+ {%- elif message.role == "tool" or message.role == "ipython" %}
82
+ {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
83
+ {%- if message.content is mapping or message.content is iterable %}
84
+ {{- message.content | tojson }}
85
+ {%- else %}
86
+ {{- message.content }}
87
+ {%- endif %}
88
+ {{- "<|eot_id|>" }}
89
+ {%- endif %}
90
+ {%- endfor %}
91
+ {%- if add_generation_prompt %}
92
+ {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
93
+ {%- endif %}
special_tokens_map.json ADDED
@@ -0,0 +1,678 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|start_audio|>",
4
+ "<|start_of_speech|>",
5
+ "<|start_phon_gen|>",
6
+ "<|end_phon_gen|>",
7
+ "<|GENERATE_PHONEMES_FROM_TEXT|>",
8
+ "<|GENERATE_TEXT_FROM_PHONEMES|>",
9
+ "<|ph_space|>",
10
+ "<|ph_0289|>",
11
+ "<|ph_025B-02E8-02E9|>",
12
+ "<|ph_0265|>",
13
+ "<|ph_0255-02B7|>",
14
+ "<|ph_0065-02D0-02E7-02E9|>",
15
+ "<|ph_0064-032A-02D0|>",
16
+ "<|ph_0075-02D0-02E9-02E9-02E6|>",
17
+ "<|ph_0076-02D0|>",
18
+ "<|ph_0250-0303|>",
19
+ "<|ph_0259-02E5|>",
20
+ "<|ph_007A-0329-02E7-02E5|>",
21
+ "<|ph_0075-0303|>",
22
+ "<|ph_028A|>",
23
+ "<|ph_0064-0292-02D0|>",
24
+ "<|ph_0065-006A|>",
25
+ "<|ph_0278-02B2|>",
26
+ "<|ph_0079-02E9|>",
27
+ "<|ph_0061-0077-02E5-02E9|>",
28
+ "<|ph_0259-02D0-02E8-02E9-02C0|>",
29
+ "<|ph_0075-02E9-02E9-02E6|>",
30
+ "<|ph_007A|>",
31
+ "<|ph_028A-02E5-02E9|>",
32
+ "<|ph_0075-02E8-02E9-02E6|>",
33
+ "<|ph_0264-02D0-02E9-02E9-02E6|>",
34
+ "<|ph_0254-02D0-02E8-02E9-02E8|>",
35
+ "<|ph_0075-0061-02E8-02E9|>",
36
+ "<|ph_00E7|>",
37
+ "<|ph_0254-02D0-02E8-02E9-02E6|>",
38
+ "<|ph_028F-02E9|>",
39
+ "<|ph_006F-0077-02E7|>",
40
+ "<|ph_006F-02D0-02E8-02E8|>",
41
+ "<|ph_0069-0259-02E8-02C0-02E5|>",
42
+ "<|ph_0069-0061-02E5-02E9|>",
43
+ "<|ph_0279|>",
44
+ "<|ph_0255-0348|>",
45
+ "<|ph_0254-02E5-02E9|>",
46
+ "<|ph_0074-02B7|>",
47
+ "<|ph_0069-02E8-02E8|>",
48
+ "<|ph_0074-0073|>",
49
+ "<|ph_0069|>",
50
+ "<|ph_006F-02E9-02E9-02E6|>",
51
+ "<|ph_026F-02D0-02E6-02E5|>",
52
+ "<|ph_0065-02D0-02E8-02E9-02E8|>",
53
+ "<|ph_0069-0259-02E8-02E6|>",
54
+ "<|ph_025B-02D0-02E7|>",
55
+ "<|ph_0070-0348-02B2|>",
56
+ "<|ph_0073|>",
57
+ "<|ph_0079-02E5|>",
58
+ "<|ph_0290|>",
59
+ "<|ph_0288-02B2|>",
60
+ "<|ph_007A-0329-02E7|>",
61
+ "<|ph_0254-02D0-02E8-02E6|>",
62
+ "<|ph_0070-02B2-02D0|>",
63
+ "<|ph_0069-02E9|>",
64
+ "<|ph_0061-02E5-02E7|>",
65
+ "<|ph_0061-0077-02E5|>",
66
+ "<|ph_0254-02D0-02E7|>",
67
+ "<|ph_006B-0348-02D0|>",
68
+ "<|ph_006F-02E8-02C0-02E5|>",
69
+ "<|ph_0268-02D0|>",
70
+ "<|ph_0073-0070-006E|>",
71
+ "<|ph_0066-02B2-02D0|>",
72
+ "<|ph_0259-0077|>",
73
+ "<|ph_0259-02E8-02E9-02E6|>",
74
+ "<|ph_0275-02E5-02E7|>",
75
+ "<|ph_0252-02D0|>",
76
+ "<|ph_007A-0329-02E8-02E9-02E6|>",
77
+ "<|ph_006F-0077-02E7-02E5|>",
78
+ "<|ph_0268-02E6-02E5|>",
79
+ "<|ph_026F-02E9-02E9-02E6|>",
80
+ "<|ph_0070-031A|>",
81
+ "<|ph_006B-02D0|>",
82
+ "<|ph_025F-02B7|>",
83
+ "<|ph_0251-02D0-02E9|>",
84
+ "<|ph_0275-02E9|>",
85
+ "<|ph_0064-02B2|>",
86
+ "<|ph_0261-02D0|>",
87
+ "<|ph_028E|>",
88
+ "<|ph_0073-0348-02B7|>",
89
+ "<|ph_025B-02D0-02E8-02E8|>",
90
+ "<|ph_0075-02D0-02E8-02E9|>",
91
+ "<|ph_0079|>",
92
+ "<|ph_0251-02D0-02E5-02E9|>",
93
+ "<|ph_0065-02D0-02E7|>",
94
+ "<|ph_0074-031A|>",
95
+ "<|ph_0065-02E8-02E8|>",
96
+ "<|ph_0289-02D0-02E5-02E7|>",
97
+ "<|ph_0069-02D0-02E8-02E9|>",
98
+ "<|ph_0075-02D0-02E8-02E9-02C0|>",
99
+ "<|ph_0078|>",
100
+ "<|ph_006B|>",
101
+ "<|ph_0259-02D0-02E8-02E9|>",
102
+ "<|ph_0069-02D0-02E8-02C0-02E5|>",
103
+ "<|ph_0064-0290-02D0|>",
104
+ "<|ph_006F-02E7|>",
105
+ "<|ph_0070-0066|>",
106
+ "<|ph_0282-02D0|>",
107
+ "<|ph_006F-02E8-02E9-02E6|>",
108
+ "<|ph_0268-02D0-02E8-02E9-02E8|>",
109
+ "<|ph_0259-02E9|>",
110
+ "<|ph_0061-02D0-02E8-02E9-02E6|>",
111
+ "<|ph_0268-02D0-02E8-02C0-02E5|>",
112
+ "<|ph_0254-02E5-02E7|>",
113
+ "<|ph_0061-006A|>",
114
+ "<|ph_007A-032A|>",
115
+ "<|ph_007A-02B2-02D0|>",
116
+ "<|ph_0063-0348|>",
117
+ "<|ph_0264-02E6-02E5|>",
118
+ "<|ph_0069-02E8-02E9|>",
119
+ "<|ph_0061-02E8-02C0-02E5|>",
120
+ "<|ph_0061-02D0-02E8-02E6|>",
121
+ "<|ph_0288-0282|>",
122
+ "<|ph_006F-02D0-02E8-02E6|>",
123
+ "<|ph_025B-02D0-02E8-02C0-02E5|>",
124
+ "<|ph_0073-02D0|>",
125
+ "<|ph_0072|>",
126
+ "<|ph_0065-02E5|>",
127
+ "<|ph_0061-02D0-02E8-02E9|>",
128
+ "<|ph_0064-032A-007A-032A-02D0|>",
129
+ "<|ph_0065-02D0-02E8-02E8|>",
130
+ "<|ph_0065-02E9|>",
131
+ "<|ph_0072-02D0|>",
132
+ "<|ph_0077-0303|>",
133
+ "<|ph_006D-0329-02E5|>",
134
+ "<|ph_026F-0061-02E7|>",
135
+ "<|ph_0064-0291|>",
136
+ "<|ph_025B-02E9|>",
137
+ "<|ph_00F8-02D0-02E5-02E7|>",
138
+ "<|ph_026F-0325|>",
139
+ "<|ph_025C-02D0|>",
140
+ "<|ph_0061-02D0-02E8-02E9-02C0|>",
141
+ "<|ph_025F|>",
142
+ "<|ph_0261|>",
143
+ "<|ph_027B|>",
144
+ "<|ph_0061-02E9-02E9-02E6|>",
145
+ "<|ph_0074-032A-02D0|>",
146
+ "<|ph_0270-0303|>",
147
+ "<|ph_025B-02D0-02E7-02E9|>",
148
+ "<|ph_027E-02B2|>",
149
+ "<|ph_0072-02B2|>",
150
+ "<|ph_006F-0077-02E5|>",
151
+ "<|ph_0074-032A|>",
152
+ "<|ph_0074-0255-0348-02D0|>",
153
+ "<|ph_0074-0283|>",
154
+ "<|ph_028F-02E5-02E9|>",
155
+ "<|ph_0064-007A|>",
156
+ "<|ph_0254-02D0-02E9-02E9-02E6|>",
157
+ "<|ph_0074-0255-02D0|>",
158
+ "<|ph_026F-02D0-02E5-02E9|>",
159
+ "<|ph_026F-02E6-02E5|>",
160
+ "<|ph_0065-006A-02E7-02E5|>",
161
+ "<|ph_006B-031A|>",
162
+ "<|ph_0290-0329|>",
163
+ "<|ph_0064|>",
164
+ "<|ph_006F-02D0|>",
165
+ "<|ph_0255-02D0|>",
166
+ "<|ph_0065-02D0-02E8-02E9-02E6|>",
167
+ "<|ph_0061-02D0-02E8-02E9-02E8|>",
168
+ "<|ph_0251-02D0|>",
169
+ "<|ph_0069-02D0-02E5-02E7|>",
170
+ "<|ph_0064-032A-007A-032A|>",
171
+ "<|ph_0069-02D0-02E7-02E9|>",
172
+ "<|ph_0075-02D0-02E8-02E8|>",
173
+ "<|ph_0075-02E8-02E6|>",
174
+ "<|ph_0078-02B7|>",
175
+ "<|ph_00F8-02D0-02E7-02E9|>",
176
+ "<|ph_006D-02B2|>",
177
+ "<|ph_007A-0329|>",
178
+ "<|ph_006D-0329-02E7|>",
179
+ "<|ph_006C|>",
180
+ "<|ph_00F8-02D0-02E5-02E9|>",
181
+ "<|ph_0065-02D0-02E8-02C0-02E5|>",
182
+ "<|ph_006F-02E7-02E5|>",
183
+ "<|ph_0061-0077-02E7-02E5|>",
184
+ "<|ph_006C-0329|>",
185
+ "<|ph_0065-02E8-02C0-02E5|>",
186
+ "<|ph_0061-0077-02E9|>",
187
+ "<|ph_0074-0073-02B2|>",
188
+ "<|ph_0268-0259-02E8-02E9-02E6|>",
189
+ "<|ph_025A|>",
190
+ "<|ph_0065-006A-02E5-02E9|>",
191
+ "<|ph_026F-02D0|>",
192
+ "<|ph_0073-02B2-02D0|>",
193
+ "<|ph_0282|>",
194
+ "<|ph_006A-02D0|>",
195
+ "<|ph_0254-02E8-02E9-02E8|>",
196
+ "<|ph_0275-02E5-02E9|>",
197
+ "<|ph_0076-02B7|>",
198
+ "<|ph_006F-02E6-02E5|>",
199
+ "<|ph_0065-02E9-02E9-02E6|>",
200
+ "<|ph_0153|>",
201
+ "<|ph_026A-02E7-02E9|>",
202
+ "<|ph_025B-02E7|>",
203
+ "<|ph_0061-02D0-02E6-02E5|>",
204
+ "<|ph_0075-0259-02E8-02E6|>",
205
+ "<|ph_0075-0259-02E8-02E9-02C0|>",
206
+ "<|ph_025B-02D0-02E8-02E9-02E8|>",
207
+ "<|ph_028A-02E9|>",
208
+ "<|ph_0062-02B2|>",
209
+ "<|ph_0069-0259-02E8-02E8|>",
210
+ "<|ph_0075-0259-02E6-02E5|>",
211
+ "<|ph_0061-02D0-02E8-02C0-02E5|>",
212
+ "<|ph_0073-0348|>",
213
+ "<|ph_0077-02D0|>",
214
+ "<|ph_0062-02B2-02D0|>",
215
+ "<|ph_0061-02E8-02E9-02E8|>",
216
+ "<|ph_026F-0061-02E9-02E9-02E6|>",
217
+ "<|ph_025B-02E9-02E9-02E6|>",
218
+ "<|ph_0061-0303|>",
219
+ "<|ph_0065-02D0-02E8-02E9|>",
220
+ "<|ph_026F-0061-02E6-02E5|>",
221
+ "<|ph_0074-0348-02B2|>",
222
+ "<|ph_0075-02E8-02E9-02E8|>",
223
+ "<|ph_014B-030D|>",
224
+ "<|ph_0075-02D0-02E8-02E9-02E8|>",
225
+ "<|ph_0065-006A-02E7|>",
226
+ "<|ph_0268-0259-02E8-02E9-02C0|>",
227
+ "<|ph_0074-0255|>",
228
+ "<|ph_0069-0259-02E8-02E9-02C0|>",
229
+ "<|ph_0259-02E8-02E9|>",
230
+ "<|ph_0065-02E8-02E9-02E8|>",
231
+ "<|ph_026F|>",
232
+ "<|ph_025B-02D0-02E8-02E6|>",
233
+ "<|ph_0278-02B7|>",
234
+ "<|ph_006F-02D0-02E8-02E9-02E8|>",
235
+ "<|ph_0075-02D0-02E8-02C0-02E5|>",
236
+ "<|ph_006E-0329-02E7-02E5|>",
237
+ "<|ph_025F-029D|>",
238
+ "<|ph_0076|>",
239
+ "<|ph_006F-0303|>",
240
+ "<|ph_0069-02E8-02E9-02E6|>",
241
+ "<|ph_0259-02D0-02E8-02E9-02E6|>",
242
+ "<|ph_0079-02E8-02E9-02E6|>",
243
+ "<|ph_0070-02B7|>",
244
+ "<|ph_0075-0259-02E8-02E9|>",
245
+ "<|ph_025F-02D0|>",
246
+ "<|ph_025B-02D0-02E5-02E9|>",
247
+ "<|ph_0254-02E8-02E6|>",
248
+ "<|ph_026A-02E5-02E7|>",
249
+ "<|ph_026B-02D0|>",
250
+ "<|ph_025B-02D0-02E5-02E7|>",
251
+ "<|ph_0065-02E8-02E9-02C0|>",
252
+ "<|ph_0274-02D0|>",
253
+ "<|ph_0061-0077-02E8-02E9-02E6|>",
254
+ "<|ph_0065|>",
255
+ "<|ph_0076-02B2|>",
256
+ "<|ph_0268-0259-02E8-02E8|>",
257
+ "<|ph_0074-0348|>",
258
+ "<|ph_0254-02D0-02E6-02E5|>",
259
+ "<|ph_0074-0255-02B7-02D0|>",
260
+ "<|ph_006E-0329|>",
261
+ "<|ph_00F8-02D0|>",
262
+ "<|ph_0254|>",
263
+ "<|ph_0069-02D0-02E8-02E8|>",
264
+ "<|ph_0075-02D0-02E6-02E5|>",
265
+ "<|ph_0066-02B2|>",
266
+ "<|ph_006F-02D0-02E8-02C0-02E5|>",
267
+ "<|ph_0290-02D0|>",
268
+ "<|ph_00E7-02D0|>",
269
+ "<|ph_0264-02D0-02E5-02E9|>",
270
+ "<|ph_006F|>",
271
+ "<|ph_0069-0259-02E8-02E9-02E6|>",
272
+ "<|ph_0069-02D0-02E8-02E9-02E6|>",
273
+ "<|ph_0267|>",
274
+ "<|ph_0259-02D0-02E8-02E8|>",
275
+ "<|ph_0272-02D0|>",
276
+ "<|ph_0268-0259-02E8-02E9|>",
277
+ "<|ph_014B-030D-02E7-02E5|>",
278
+ "<|ph_006F-02D0-02E9-02E9-02E6|>",
279
+ "<|ph_0261-0062|>",
280
+ "<|ph_0061-02E6-02E5|>",
281
+ "<|ph_014B-006D|>",
282
+ "<|ph_0283|>",
283
+ "<|ph_028E-02D0|>",
284
+ "<|ph_029D|>",
285
+ "<|ph_0062-02B7|>",
286
+ "<|ph_0074-0255-02B7|>",
287
+ "<|ph_0074-02B2-02D0|>",
288
+ "<|ph_028F-02E7-02E9|>",
289
+ "<|ph_0288-02B0|>",
290
+ "<|ph_0072-02B2-02D0|>",
291
+ "<|ph_0259-02E6-02E5|>",
292
+ "<|ph_0069-02D0-02E8-02E9-02C0|>",
293
+ "<|ph_0268-0259-02E8-02E9-02E8|>",
294
+ "<|ph_0075-02E5-02E9|>",
295
+ "<|ph_0077|>",
296
+ "<|ph_0268-02E8-02E9-02E6|>",
297
+ "<|ph_026F-02E5-02E9|>",
298
+ "<|ph_026F-02E7|>",
299
+ "<|ph_0069-02D0-02E7|>",
300
+ "<|ph_0075-02E7|>",
301
+ "<|ph_006D-0329|>",
302
+ "<|ph_026B-0329|>",
303
+ "<|ph_025B-02E5-02E9|>",
304
+ "<|ph_0289-02D0-02E7-02E9|>",
305
+ "<|ph_0073-032A-02D0|>",
306
+ "<|ph_0259-02D0-02E8-02C0-02E5|>",
307
+ "<|ph_0075-0061-02E7|>",
308
+ "<|ph_0290-0329-02E7-02E5|>",
309
+ "<|ph_0075-0061-02E9-02E9-02E6|>",
310
+ "<|ph_0062-02D0|>",
311
+ "<|ph_025B-02D0|>",
312
+ "<|ph_025D|>",
313
+ "<|ph_0264-02E8-02E9|>",
314
+ "<|ph_0074|>",
315
+ "<|ph_0254-02D0-02E8-02E8|>",
316
+ "<|ph_0069-02D0-02E8-02E9-02E8|>",
317
+ "<|ph_0254-02E7|>",
318
+ "<|ph_0065-02D0-02E9|>",
319
+ "<|ph_0061-006A-02E7|>",
320
+ "<|ph_006D|>",
321
+ "<|ph_0061-02E8-02E9|>",
322
+ "<|ph_0268-02E8-02C0-02E5|>",
323
+ "<|ph_00E6|>",
324
+ "<|ph_0074-02D0|>",
325
+ "<|ph_0065-02E8-02E9-02E6|>",
326
+ "<|ph_0073-0348-02D0|>",
327
+ "<|ph_0069-02E7|>",
328
+ "<|ph_0268-0259-02E8-02C0-02E5|>",
329
+ "<|ph_0079-02E5-02E9|>",
330
+ "<|ph_006E-032A-02D0|>",
331
+ "<|ph_0075-02D0-02E8-02E9-02E6|>",
332
+ "<|ph_0153-02E5-02E9|>",
333
+ "<|ph_0063-02B7|>",
334
+ "<|ph_0074-032A-02B0|>",
335
+ "<|ph_0275|>",
336
+ "<|ph_0063-02B0-02D0|>",
337
+ "<|ph_006F-02E5|>",
338
+ "<|ph_0075-0061-02E6-02E5|>",
339
+ "<|ph_0069-02D0-02E9-02E9-02E6|>",
340
+ "<|ph_0270|>",
341
+ "<|ph_0261-02B7|>",
342
+ "<|ph_0254-02D0-02E5-02E9|>",
343
+ "<|ph_028C|>",
344
+ "<|ph_0268|>",
345
+ "<|ph_026F-02D0-02E7|>",
346
+ "<|ph_0069-0259-02E8-02E9-02E8|>",
347
+ "<|ph_0074-032A-0073-032A-02D0|>",
348
+ "<|ph_025C|>",
349
+ "<|ph_0064-0291-02B7|>",
350
+ "<|ph_028F|>",
351
+ "<|ph_0257|>",
352
+ "<|ph_0070-0348-02B7|>",
353
+ "<|ph_0074-0255-0348-02B7|>",
354
+ "<|ph_0292|>",
355
+ "<|ph_03B2|>",
356
+ "<|ph_0063-02B0|>",
357
+ "<|ph_00F8-02D0-02E9|>",
358
+ "<|ph_0069-02E8-02E9-02C0|>",
359
+ "<|ph_0061-02E7|>",
360
+ "<|ph_0064-0292|>",
361
+ "<|ph_0268-02E8-02E9-02C0|>",
362
+ "<|ph_0263|>",
363
+ "<|ph_0288|>",
364
+ "<|ph_0283-02D0|>",
365
+ "<|ph_006F-02E8-02E8|>",
366
+ "<|ph_0061-006A-02E5-02E9|>",
367
+ "<|ph_0153-02E7-02E9|>",
368
+ "<|ph_0069-0061-02E6-02E5|>",
369
+ "<|ph_0294|>",
370
+ "<|ph_0064-02B2-02D0|>",
371
+ "<|ph_027E-02D0|>",
372
+ "<|ph_0061-006A-02E5|>",
373
+ "<|ph_0069-02E8-02E6|>",
374
+ "<|ph_028C-02D0|>",
375
+ "<|ph_0252|>",
376
+ "<|ph_0065-02D0-02E8-02E6|>",
377
+ "<|ph_0278-02D0|>",
378
+ "<|ph_006F-0077-02E8-02E9-02E6|>",
379
+ "<|ph_0266|>",
380
+ "<|ph_0069-02E5|>",
381
+ "<|ph_0254-02E9|>",
382
+ "<|ph_0065-006A-02E8-02E9-02E6|>",
383
+ "<|ph_0074-02B0|>",
384
+ "<|ph_0264-02E9-02E9-02E6|>",
385
+ "<|ph_006E-0329-02E8-02E9-02E6|>",
386
+ "<|ph_0064-0291-02D0|>",
387
+ "<|ph_0255|>",
388
+ "<|ph_0064-02D0|>",
389
+ "<|ph_0259-02D0-02E6-02E5|>",
390
+ "<|ph_007A-0329-02E5|>",
391
+ "<|ph_0075-02E7-02E5|>",
392
+ "<|ph_0079-02E7-02E5|>",
393
+ "<|ph_0075-0259-02E8-02C0-02E5|>",
394
+ "<|ph_0254-02E8-02E9-02C0|>",
395
+ "<|ph_0075-02D0-02E5-02E7|>",
396
+ "<|ph_0069-0061-02E9-02E9-02E6|>",
397
+ "<|ph_006F-02D0-02E7-02E9|>",
398
+ "<|ph_0268-02E8-02E6|>",
399
+ "<|ph_006F-02D0-02E8-02E9-02C0|>",
400
+ "<|ph_006F-02D0-02E5-02E7|>",
401
+ "<|ph_0061-02E8-02E9-02C0|>",
402
+ "<|ph_0254-02D0-02E8-02C0-02E5|>",
403
+ "<|ph_0061-02D0-02E7|>",
404
+ "<|ph_0268-0259-02E8-02E6|>",
405
+ "<|ph_0064-007A-02B2-02D0|>",
406
+ "<|ph_0069-02E8-02E9-02E8|>",
407
+ "<|ph_0076-02B2-02D0|>",
408
+ "<|ph_0065-02D0|>",
409
+ "<|ph_0290-0329-02E8-02E9-02E6|>",
410
+ "<|ph_006E-02D0|>",
411
+ "<|ph_0075-0259-02E8-02E9-02E6|>",
412
+ "<|ph_0073-02B7|>",
413
+ "<|ph_007A-0329-02E5-02E9|>",
414
+ "<|ph_0075-02D0|>",
415
+ "<|ph_0074-0283-02D0|>",
416
+ "<|ph_0288-0282-02B0|>",
417
+ "<|ph_026A-02E5-02E9|>",
418
+ "<|ph_014B|>",
419
+ "<|ph_0079-02E7|>",
420
+ "<|ph_006B-02B0|>",
421
+ "<|ph_0069-02E5-02E9|>",
422
+ "<|ph_0259-02E8-02E8|>",
423
+ "<|ph_0070-0348-02D0|>",
424
+ "<|ph_0274|>",
425
+ "<|ph_0061-02D0-02E8-02E8|>",
426
+ "<|ph_0070-0348|>",
427
+ "<|ph_0259-02D0-02E8-02E9-02E8|>",
428
+ "<|ph_006F-02E8-02E9-02E8|>",
429
+ "<|ph_006B-02B7|>",
430
+ "<|ph_007A-02B2|>",
431
+ "<|ph_0074-02B7-02D0|>",
432
+ "<|ph_00F8|>",
433
+ "<|ph_026A-02E9|>",
434
+ "<|ph_0074-0255-02B0|>",
435
+ "<|ph_0251-0303|>",
436
+ "<|ph_0074-0348-02D0|>",
437
+ "<|ph_0259-02E7-02E5|>",
438
+ "<|ph_006B-02B7-02D0|>",
439
+ "<|ph_0074-032A-0073-032A|>",
440
+ "<|ph_0268-02D0-02E6-02E5|>",
441
+ "<|ph_0061|>",
442
+ "<|ph_0069-02E7-02E5|>",
443
+ "<|ph_0078-02D0|>",
444
+ "<|ph_0075-02E8-02E9|>",
445
+ "<|ph_0070-02B2|>",
446
+ "<|ph_0271|>",
447
+ "<|ph_0075-0259-02E8-02E8|>",
448
+ "<|ph_006F-02E8-02E6|>",
449
+ "<|ph_0075-02E5|>",
450
+ "<|ph_0290-0329-02E9|>",
451
+ "<|ph_0068-02D0|>",
452
+ "<|ph_0259-02E5-02E9|>",
453
+ "<|ph_0075-02E8-02E9-02C0|>",
454
+ "<|ph_0065-006A-02E9|>",
455
+ "<|ph_0069-0061-02E8-02E9|>",
456
+ "<|ph_006C-032A|>",
457
+ "<|ph_0069-02E6-02E5|>",
458
+ "<|ph_0074-0282-02D0|>",
459
+ "<|ph_006F-02E9|>",
460
+ "<|ph_03B2-02B7|>",
461
+ "<|ph_0268-0325|>",
462
+ "<|ph_0278-02B2-02D0|>",
463
+ "<|ph_0064-007A-02D0|>",
464
+ "<|ph_0268-02D0-02E8-02E9|>",
465
+ "<|ph_0074-0073-02B0|>",
466
+ "<|ph_006D-0329-02E8-02E9-02E6|>",
467
+ "<|ph_0079-02D0-02E9|>",
468
+ "<|ph_0074-02B2|>",
469
+ "<|ph_0259-02E8-02E9-02E8|>",
470
+ "<|ph_0061-0077|>",
471
+ "<|ph_0069-0061-02E7|>",
472
+ "<|ph_0074-0073-02D0|>",
473
+ "<|ph_006A-0303|>",
474
+ "<|ph_0064-02B7|>",
475
+ "<|ph_007A-032A-02D0|>",
476
+ "<|ph_0254-02D0-02E8-02E9-02C0|>",
477
+ "<|ph_0259-02E8-02E9-02C0|>",
478
+ "<|ph_006F-02D0-02E8-02E9|>",
479
+ "<|ph_0251|>",
480
+ "<|ph_0065-02D0-02E5-02E9|>",
481
+ "<|ph_0066-02D0|>",
482
+ "<|ph_0065-02D0-02E8-02E9-02C0|>",
483
+ "<|ph_0069-02D0-02E5-02E9|>",
484
+ "<|ph_0268-02D0-02E8-02E8|>",
485
+ "<|ph_026F-02D0-02E9-02E9-02E6|>",
486
+ "<|ph_0061-02E9|>",
487
+ "<|ph_007A-0329-02E9|>",
488
+ "<|ph_0272|>",
489
+ "<|ph_026A|>",
490
+ "<|ph_0075-02E8-02C0-02E5|>",
491
+ "<|ph_0061-02E8-02E6|>",
492
+ "<|ph_0066-02B7|>",
493
+ "<|ph_0065-02D0-02E9-02E9-02E6|>",
494
+ "<|ph_0259-02D0-02E8-02E6|>",
495
+ "<|ph_0291-02D0|>",
496
+ "<|ph_0259-02E8-02C0-02E5|>",
497
+ "<|ph_0065-006A-02E5|>",
498
+ "<|ph_006D-02D0|>",
499
+ "<|ph_0254-02E7-02E9|>",
500
+ "<|ph_0069-02E8-02C0-02E5|>",
501
+ "<|ph_0254-02E6-02E5|>",
502
+ "<|ph_027E-0303|>",
503
+ "<|ph_0061-006A-02E7-02E5|>",
504
+ "<|ph_0079-02D0-02E5-02E9|>",
505
+ "<|ph_026D|>",
506
+ "<|ph_0289-02D0|>",
507
+ "<|ph_0075-02E8-02E8|>",
508
+ "<|ph_025B-02D0-02E9-02E9-02E6|>",
509
+ "<|ph_0264-02D0-02E7|>",
510
+ "<|ph_006F-02D0-02E8-02E9-02E6|>",
511
+ "<|ph_014B-030D-02E5-02E9|>",
512
+ "<|ph_0254-028F|>",
513
+ "<|ph_006B-02B0-02D0|>",
514
+ "<|ph_025B-02E5-02E7|>",
515
+ "<|ph_025B-02E7-02E9|>",
516
+ "<|ph_0075-0259-02E8-02E9-02E8|>",
517
+ "<|ph_0061-006A-02E8-02E9-02E6|>",
518
+ "<|ph_0069-0259-02E6-02E5|>",
519
+ "<|ph_0069-0303|>",
520
+ "<|ph_025B-02D0-02E8-02E9|>",
521
+ "<|ph_025B|>",
522
+ "<|ph_0264-02E5-02E9|>",
523
+ "<|ph_026B|>",
524
+ "<|ph_0264-02E7|>",
525
+ "<|ph_0268-02E8-02E8|>",
526
+ "<|ph_0068|>",
527
+ "<|ph_028B|>",
528
+ "<|ph_0065-02E5-02E9|>",
529
+ "<|ph_0254-02E8-02E9-02E6|>",
530
+ "<|ph_0264-02D0-02E8-02E9|>",
531
+ "<|ph_0073-0069-006C|>",
532
+ "<|ph_0069-02D0-02E6-02E5|>",
533
+ "<|ph_0061-02D0-02E5-02E9|>",
534
+ "<|ph_025B-02D0-02E6-02E5|>",
535
+ "<|ph_027E-02B7|>",
536
+ "<|ph_0073-02B0-02D0|>",
537
+ "<|ph_025B-0303|>",
538
+ "<|ph_006F-02D0-02E5-02E9|>",
539
+ "<|ph_0254-02E8-02E9|>",
540
+ "<|ph_006E-032A|>",
541
+ "<|ph_006A|>",
542
+ "<|ph_0264-02D0-02E6-02E5|>",
543
+ "<|ph_0070-02D0|>",
544
+ "<|ph_0065-02D0-02E6-02E5|>",
545
+ "<|ph_0254-02E9-02E9-02E6|>",
546
+ "<|ph_00F0|>",
547
+ "<|ph_0253|>",
548
+ "<|ph_0275-02E7-02E9|>",
549
+ "<|ph_0064-032A|>",
550
+ "<|ph_0073-02B2|>",
551
+ "<|ph_0290-0329-02E5|>",
552
+ "<|ph_025B-02D0-02E8-02E9-02C0|>",
553
+ "<|ph_0063|>",
554
+ "<|ph_006E|>",
555
+ "<|ph_006F-0077-02E9|>",
556
+ "<|ph_0079-02D0-02E5-02E7|>",
557
+ "<|ph_0070|>",
558
+ "<|ph_028F-02E5-02E7|>",
559
+ "<|ph_0075-02E6-02E5|>",
560
+ "<|ph_0073-02B0|>",
561
+ "<|ph_006F-02D0-02E7|>",
562
+ "<|ph_0069-02D0|>",
563
+ "<|ph_0268-0259-02E6-02E5|>",
564
+ "<|ph_0061-02D0|>",
565
+ "<|ph_0075-02D0-02E7|>",
566
+ "<|ph_006B-0348-02B7|>",
567
+ "<|ph_0070-02B0-02D0|>",
568
+ "<|ph_0065-02E6-02E5|>",
569
+ "<|ph_0069-0325|>",
570
+ "<|ph_0066|>",
571
+ "<|ph_0075|>",
572
+ "<|ph_0069-02E9-02E9-02E6|>",
573
+ "<|ph_0062|>",
574
+ "<|ph_0063-02D0|>",
575
+ "<|ph_0273|>",
576
+ "<|ph_0254-02D0-02E8-02E9|>",
577
+ "<|ph_0065-02D0-02E5-02E7|>",
578
+ "<|ph_03B8|>",
579
+ "<|ph_0061-006A-02E9|>",
580
+ "<|ph_0061-02E7-02E9|>",
581
+ "<|ph_0069-02D0-02E8-02E6|>",
582
+ "<|ph_006D-0329-02E5-02E9|>",
583
+ "<|ph_026F-02D0-02E8-02E9|>",
584
+ "<|ph_0075-02D0-02E5-02E9|>",
585
+ "<|ph_0291|>",
586
+ "<|ph_0065-02E7-02E5|>",
587
+ "<|ph_0268-02D0-02E8-02E9-02C0|>",
588
+ "<|ph_0061-02E5-02E9|>",
589
+ "<|ph_028A-02E7-02E9|>",
590
+ "<|ph_0268-02E8-02E9-02E8|>",
591
+ "<|ph_026F-02E8-02E9|>",
592
+ "<|ph_0259-02E7|>",
593
+ "<|ph_0061-02E7-02E5|>",
594
+ "<|ph_0065-02E8-02E9|>",
595
+ "<|ph_0069-0259-02E8-02E9|>",
596
+ "<|ph_006F-02E8-02E9|>",
597
+ "<|ph_0061-02E8-02E8|>",
598
+ "<|ph_006F-0077-02E5-02E9|>",
599
+ "<|ph_0075-02D0-02E7-02E9|>",
600
+ "<|ph_0065-0303|>",
601
+ "<|ph_0254-02E8-02C0-02E5|>",
602
+ "<|ph_0268-02E8-02E9|>",
603
+ "<|ph_006D-0329-02E7-02E5|>",
604
+ "<|ph_006E-0329-02E5-02E9|>",
605
+ "<|ph_0290-0329-02E7|>",
606
+ "<|ph_0075-02E9|>",
607
+ "<|ph_006F-0077|>",
608
+ "<|ph_0290-0329-02E5-02E9|>",
609
+ "<|ph_0254-0303|>",
610
+ "<|ph_0254-02E8-02E8|>",
611
+ "<|ph_006B-0348|>",
612
+ "<|ph_0079-02D0|>",
613
+ "<|ph_0250|>",
614
+ "<|ph_0075-02D0-02E8-02E6|>",
615
+ "<|ph_026F-0061-02E5-02E9|>",
616
+ "<|ph_025B-02E6-02E5|>",
617
+ "<|ph_0074-0255-02B0-02D0|>",
618
+ "<|ph_0075-0061-02E5-02E9|>",
619
+ "<|ph_0064-0290|>",
620
+ "<|ph_0259-02E8-02E6|>",
621
+ "<|ph_0281|>",
622
+ "<|ph_0061-02D0-02E9-02E9-02E6|>",
623
+ "<|ph_0256|>",
624
+ "<|ph_0288-02B7|>",
625
+ "<|ph_025B-02D0-02E8-02E9-02E6|>",
626
+ "<|ph_0070-02B0|>",
627
+ "<|ph_0254-006A|>",
628
+ "<|ph_026D-02D0|>",
629
+ "<|ph_006F-02E5-02E9|>",
630
+ "<|ph_0061-0077-02E7|>",
631
+ "<|ph_0074-0282|>",
632
+ "<|ph_0255-02B0|>",
633
+ "<|ph_006B-0070|>",
634
+ "<|ph_0251-02D0-02E7-02E9|>",
635
+ "<|ph_026F-0061-02E8-02E9|>",
636
+ "<|ph_014B-030D-02E8-02E9-02E6|>",
637
+ "<|ph_0061-02E8-02E9-02E6|>",
638
+ "<|ph_0073-032A|>",
639
+ "<|ph_0065-02E7|>",
640
+ "<|ph_0079-02D0-02E7-02E9|>",
641
+ "<|ph_006F-02D0-02E6-02E5|>",
642
+ "<|ph_0074-02B0-02D0|>",
643
+ "<|ph_0251-02D0-02E5-02E7|>",
644
+ "<|ph_0259|>",
645
+ "<|ph_0061-02E5|>",
646
+ "<|ph_0278|>",
647
+ "<|ph_0268-02D0-02E8-02E6|>",
648
+ "<|ph_027E|>",
649
+ "<|ph_027E-02B2-02D0|>",
650
+ "<|ph_006F-02D0-02E9|>",
651
+ "<|ph_0268-02D0-02E8-02E9-02E6|>",
652
+ "<|ph_006F-02E8-02E9-02C0|>",
653
+ "<|ph_006D-02B2-02D0|>",
654
+ "<|ph_0289-02D0-02E5-02E9|>",
655
+ "<|ph_0074-0255-0348|>"
656
+ ],
657
+ "bos_token": {
658
+ "content": "<|begin_of_text|>",
659
+ "lstrip": false,
660
+ "normalized": false,
661
+ "rstrip": false,
662
+ "single_word": false
663
+ },
664
+ "eos_token": {
665
+ "content": "<|eot_id|>",
666
+ "lstrip": false,
667
+ "normalized": false,
668
+ "rstrip": false,
669
+ "single_word": false
670
+ },
671
+ "pad_token": {
672
+ "content": "<|eot_id|>",
673
+ "lstrip": false,
674
+ "normalized": false,
675
+ "rstrip": false,
676
+ "single_word": false
677
+ }
678
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29da3b5cfb25e3d531cc3e07fd5b22d40cf644e5df9f99307c467b59bf825a9a
3
+ size 29650442
tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77d48da4cbf813726cb90cc11fa675afeec3b90649b32834c1b3eb68ce4f639
3
+ size 11847842