seranky-nv12 committed on
Commit
5f947e2
·
verified ·
1 Parent(s): 2a14915

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +4 -0
  2. README.md +61 -0
  3. adapter_config.json +49 -0
  4. adapter_model.safetensors +3 -0
  5. chat_template.jinja +331 -0
  6. checkpoint-1642/README.md +208 -0
  7. checkpoint-1642/adapter_config.json +49 -0
  8. checkpoint-1642/adapter_model.safetensors +3 -0
  9. checkpoint-1642/chat_template.jinja +331 -0
  10. checkpoint-1642/optimizer.pt +3 -0
  11. checkpoint-1642/rng_state_0.pth +3 -0
  12. checkpoint-1642/rng_state_1.pth +3 -0
  13. checkpoint-1642/rng_state_2.pth +3 -0
  14. checkpoint-1642/rng_state_3.pth +3 -0
  15. checkpoint-1642/rng_state_4.pth +3 -0
  16. checkpoint-1642/rng_state_5.pth +3 -0
  17. checkpoint-1642/rng_state_6.pth +3 -0
  18. checkpoint-1642/rng_state_7.pth +3 -0
  19. checkpoint-1642/scheduler.pt +3 -0
  20. checkpoint-1642/special_tokens_map.json +1817 -0
  21. checkpoint-1642/tokenizer.json +3 -0
  22. checkpoint-1642/tokenizer_config.json +2489 -0
  23. checkpoint-1642/trainer_state.json +1510 -0
  24. checkpoint-1642/training_args.bin +3 -0
  25. checkpoint-3284/README.md +208 -0
  26. checkpoint-3284/adapter_config.json +49 -0
  27. checkpoint-3284/adapter_model.safetensors +3 -0
  28. checkpoint-3284/chat_template.jinja +331 -0
  29. checkpoint-3284/optimizer.pt +3 -0
  30. checkpoint-3284/rng_state_0.pth +3 -0
  31. checkpoint-3284/rng_state_1.pth +3 -0
  32. checkpoint-3284/rng_state_2.pth +3 -0
  33. checkpoint-3284/rng_state_3.pth +3 -0
  34. checkpoint-3284/rng_state_4.pth +3 -0
  35. checkpoint-3284/rng_state_5.pth +3 -0
  36. checkpoint-3284/rng_state_6.pth +3 -0
  37. checkpoint-3284/rng_state_7.pth +3 -0
  38. checkpoint-3284/scheduler.pt +3 -0
  39. checkpoint-3284/special_tokens_map.json +1817 -0
  40. checkpoint-3284/tokenizer.json +3 -0
  41. checkpoint-3284/tokenizer_config.json +2489 -0
  42. checkpoint-3284/trainer_state.json +2986 -0
  43. checkpoint-3284/training_args.bin +3 -0
  44. checkpoint-4926/README.md +208 -0
  45. checkpoint-4926/adapter_config.json +49 -0
  46. checkpoint-4926/adapter_model.safetensors +3 -0
  47. checkpoint-4926/chat_template.jinja +331 -0
  48. checkpoint-4926/optimizer.pt +3 -0
  49. checkpoint-4926/rng_state_0.pth +3 -0
  50. checkpoint-4926/rng_state_1.pth +3 -0
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint-1642/tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint-3284/tokenizer.json filter=lfs diff=lfs merge=lfs -text
38
+ checkpoint-4926/tokenizer.json filter=lfs diff=lfs merge=lfs -text
39
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: openai/gpt-oss-20b
3
+ library_name: peft
4
+ model_name: gpt-oss-20b-finetuned
5
+ tags:
6
+ - base_model:adapter:openai/gpt-oss-20b
7
+ - lora
8
+ - sft
9
+ - transformers
10
+ - trl
11
+ licence: license
12
+ ---
13
+
14
+ # Model Card for gpt-oss-20b-finetuned
15
+
16
+ This model is a fine-tuned version of [openai/gpt-oss-20b](https://huggingface.co/openai/gpt-oss-20b).
17
+ It has been trained using [TRL](https://github.com/huggingface/trl).
18
+
19
+ ## Quick start
20
+
21
+ ```python
22
+ from transformers import pipeline
23
+
24
+ question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
25
+ generator = pipeline("text-generation", model="None", device="cuda")
26
+ output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
27
+ print(output["generated_text"])
28
+ ```
29
+
30
+ ## Training procedure
31
+
32
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/srikar-eranky-uc-san-diego/dos-expert/runs/evauaygh)
33
+
34
+
35
+ This model was trained with SFT.
36
+
37
+ ### Framework versions
38
+
39
+ - PEFT: 0.17.1
40
+ - TRL: 0.21.0
41
+ - Transformers: 4.55.4
42
+ - Pytorch: 2.7.1+cu118
43
+ - Datasets: 4.0.0
44
+ - Tokenizers: 0.21.4
45
+
46
+ ## Citations
47
+
48
+
49
+
50
+ Cite TRL as:
51
+
52
+ ```bibtex
53
+ @misc{vonwerra2022trl,
54
+ title = {{TRL: Transformer Reinforcement Learning}},
55
+ author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
56
+ year = 2020,
57
+ journal = {GitHub repository},
58
+ publisher = {GitHub},
59
+ howpublished = {\url{https://github.com/huggingface/trl}}
60
+ }
61
+ ```
adapter_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "GptOssForCausalLM",
5
+ "parent_library": "transformers.models.gpt_oss.modeling_gpt_oss"
6
+ },
7
+ "base_model_name_or_path": "openai/gpt-oss-20b",
8
+ "bias": "none",
9
+ "corda_config": null,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 16,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.0,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "qalora_group_size": 16,
27
+ "r": 8,
28
+ "rank_pattern": {},
29
+ "revision": null,
30
+ "target_modules": [
31
+ "o_proj",
32
+ "k_proj",
33
+ "v_proj",
34
+ "q_proj"
35
+ ],
36
+ "target_parameters": [
37
+ "7.mlp.experts.gate_up_proj",
38
+ "7.mlp.experts.down_proj",
39
+ "15.mlp.experts.gate_up_proj",
40
+ "15.mlp.experts.down_proj",
41
+ "23.mlp.experts.gate_up_proj",
42
+ "23.mlp.experts.down_proj"
43
+ ],
44
+ "task_type": null,
45
+ "trainable_token_indices": null,
46
+ "use_dora": false,
47
+ "use_qalora": false,
48
+ "use_rslora": false
49
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a12fc000b95c82bac6a99a48756a04e45988fdbd7cf08e8fc7d3059abbcb8677
3
+ size 2366470368
chat_template.jinja ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#-
2
+ In addition to the normal inputs of `messages` and `tools`, this template also accepts the
3
+ following kwargs:
4
+ - "builtin_tools": A list, can contain "browser" and/or "python".
5
+ - "model_identity": A string that optionally describes the model identity.
6
+ - "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
7
+ #}
8
+
9
+ {#- Tool Definition Rendering ============================================== #}
10
+ {%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}
11
+ {%- if param_spec.type == "array" -%}
12
+ {%- if param_spec['items'] -%}
13
+ {%- if param_spec['items']['type'] == "string" -%}
14
+ {{- "string[]" }}
15
+ {%- elif param_spec['items']['type'] == "number" -%}
16
+ {{- "number[]" }}
17
+ {%- elif param_spec['items']['type'] == "integer" -%}
18
+ {{- "number[]" }}
19
+ {%- elif param_spec['items']['type'] == "boolean" -%}
20
+ {{- "boolean[]" }}
21
+ {%- else -%}
22
+ {%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
23
+ {%- if inner_type == "object | object" or inner_type|length > 50 -%}
24
+ {{- "any[]" }}
25
+ {%- else -%}
26
+ {{- inner_type + "[]" }}
27
+ {%- endif -%}
28
+ {%- endif -%}
29
+ {%- if param_spec.nullable -%}
30
+ {{- " | null" }}
31
+ {%- endif -%}
32
+ {%- else -%}
33
+ {{- "any[]" }}
34
+ {%- if param_spec.nullable -%}
35
+ {{- " | null" }}
36
+ {%- endif -%}
37
+ {%- endif -%}
38
+ {%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
39
+ {#- Handle array of types like ["object", "object"] from Union[dict, list] #}
40
+ {%- if param_spec.type | length > 1 -%}
41
+ {{- param_spec.type | join(" | ") }}
42
+ {%- else -%}
43
+ {{- param_spec.type[0] }}
44
+ {%- endif -%}
45
+ {%- elif param_spec.oneOf -%}
46
+ {#- Handle oneOf schemas - check for complex unions and fallback to any #}
47
+ {%- set has_object_variants = false -%}
48
+ {%- for variant in param_spec.oneOf -%}
49
+ {%- if variant.type == "object" -%}
50
+ {%- set has_object_variants = true -%}
51
+ {%- endif -%}
52
+ {%- endfor -%}
53
+ {%- if has_object_variants and param_spec.oneOf|length > 1 -%}
54
+ {{- "any" }}
55
+ {%- else -%}
56
+ {%- for variant in param_spec.oneOf -%}
57
+ {{- render_typescript_type(variant, required_params) -}}
58
+ {%- if variant.description %}
59
+ {{- "// " + variant.description }}
60
+ {%- endif -%}
61
+ {%- if variant.default is defined %}
62
+ {{ "// default: " + variant.default|tojson }}
63
+ {%- endif -%}
64
+ {%- if not loop.last %}
65
+ {{- " | " }}
66
+ {% endif -%}
67
+ {%- endfor -%}
68
+ {%- endif -%}
69
+ {%- elif param_spec.type == "string" -%}
70
+ {%- if param_spec.enum -%}
71
+ {{- '"' + param_spec.enum|join('" | "') + '"' -}}
72
+ {%- else -%}
73
+ {{- "string" }}
74
+ {%- if param_spec.nullable %}
75
+ {{- " | null" }}
76
+ {%- endif -%}
77
+ {%- endif -%}
78
+ {%- elif param_spec.type == "number" -%}
79
+ {{- "number" }}
80
+ {%- elif param_spec.type == "integer" -%}
81
+ {{- "number" }}
82
+ {%- elif param_spec.type == "boolean" -%}
83
+ {{- "boolean" }}
84
+
85
+ {%- elif param_spec.type == "object" -%}
86
+ {%- if param_spec.properties -%}
87
+ {{- "{\n" }}
88
+ {%- for prop_name, prop_spec in param_spec.properties.items() -%}
89
+ {{- prop_name -}}
90
+ {%- if prop_name not in (param_spec.required or []) -%}
91
+ {{- "?" }}
92
+ {%- endif -%}
93
+ {{- ": " }}
94
+ {{ render_typescript_type(prop_spec, param_spec.required or []) }}
95
+ {%- if not loop.last -%}
96
+ {{-", " }}
97
+ {%- endif -%}
98
+ {%- endfor -%}
99
+ {{- "}" }}
100
+ {%- else -%}
101
+ {{- "object" }}
102
+ {%- endif -%}
103
+ {%- else -%}
104
+ {{- "any" }}
105
+ {%- endif -%}
106
+ {%- endmacro -%}
107
+
108
+ {%- macro render_tool_namespace(namespace_name, tools) -%}
109
+ {{- "## " + namespace_name + "\n\n" }}
110
+ {{- "namespace " + namespace_name + " {\n\n" }}
111
+ {%- for tool in tools %}
112
+ {%- set tool = tool.function %}
113
+ {{- "// " + tool.description + "\n" }}
114
+ {{- "type "+ tool.name + " = " }}
115
+ {%- if tool.parameters and tool.parameters.properties %}
116
+ {{- "(_: {\n" }}
117
+ {%- for param_name, param_spec in tool.parameters.properties.items() %}
118
+ {%- if param_spec.description %}
119
+ {{- "// " + param_spec.description + "\n" }}
120
+ {%- endif %}
121
+ {{- param_name }}
122
+ {%- if param_name not in (tool.parameters.required or []) -%}
123
+ {{- "?" }}
124
+ {%- endif -%}
125
+ {{- ": " }}
126
+ {{- render_typescript_type(param_spec, tool.parameters.required or []) }}
127
+ {%- if param_spec.default is defined -%}
128
+ {%- if param_spec.enum %}
129
+ {{- ", // default: " + param_spec.default }}
130
+ {%- elif param_spec.oneOf %}
131
+ {{- "// default: " + param_spec.default }}
132
+ {%- else %}
133
+ {{- ", // default: " + param_spec.default|tojson }}
134
+ {%- endif -%}
135
+ {%- endif -%}
136
+ {%- if not loop.last %}
137
+ {{- ",\n" }}
138
+ {%- else %}
139
+ {{- ",\n" }}
140
+ {%- endif -%}
141
+ {%- endfor %}
142
+ {{- "}) => any;\n\n" }}
143
+ {%- else -%}
144
+ {{- "() => any;\n\n" }}
145
+ {%- endif -%}
146
+ {%- endfor %}
147
+ {{- "} // namespace " + namespace_name }}
148
+ {%- endmacro -%}
149
+
150
+ {%- macro render_builtin_tools(browser_tool, python_tool) -%}
151
+ {%- if browser_tool %}
152
+ {{- "## browser\n\n" }}
153
+ {{- "// Tool for browsing.\n" }}
154
+ {{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
155
+ {{- "// Cite information from the tool using the following format:\n" }}
156
+ {{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
157
+ {{- "// Do not quote more than 10 words directly from the tool output.\n" }}
158
+ {{- "// sources=web (default: web)\n" }}
159
+ {{- "namespace browser {\n\n" }}
160
+ {{- "// Searches for information related to `query` and displays `topn` results.\n" }}
161
+ {{- "type search = (_: {\n" }}
162
+ {{- "query: string,\n" }}
163
+ {{- "topn?: number, // default: 10\n" }}
164
+ {{- "source?: string,\n" }}
165
+ {{- "}) => any;\n\n" }}
166
+ {{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
167
+ {{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
168
+ {{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
169
+ {{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
170
+ {{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
171
+ {{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
172
+ {{- "type open = (_: {\n" }}
173
+ {{- "id?: number | string, // default: -1\n" }}
174
+ {{- "cursor?: number, // default: -1\n" }}
175
+ {{- "loc?: number, // default: -1\n" }}
176
+ {{- "num_lines?: number, // default: -1\n" }}
177
+ {{- "view_source?: boolean, // default: false\n" }}
178
+ {{- "source?: string,\n" }}
179
+ {{- "}) => any;\n\n" }}
180
+ {{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
181
+ {{- "type find = (_: {\n" }}
182
+ {{- "pattern: string,\n" }}
183
+ {{- "cursor?: number, // default: -1\n" }}
184
+ {{- "}) => any;\n\n" }}
185
+ {{- "} // namespace browser\n\n" }}
186
+ {%- endif -%}
187
+
188
+ {%- if python_tool %}
189
+ {{- "## python\n\n" }}
190
+ {{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
191
+ {{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
192
+ {%- endif -%}
193
+ {%- endmacro -%}
194
+
195
+ {#- System Message Construction ============================================ #}
196
+ {%- macro build_system_message() -%}
197
+ {%- if model_identity is not defined %}
198
+ {%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
199
+ {%- endif %}
200
+ {{- model_identity + "\n" }}
201
+ {{- "Knowledge cutoff: 2024-06\n" }}
202
+ {{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}
203
+ {%- if reasoning_effort is not defined %}
204
+ {%- set reasoning_effort = "medium" %}
205
+ {%- endif %}
206
+ {{- "Reasoning: " + reasoning_effort + "\n\n" }}
207
+ {%- if builtin_tools %}
208
+ {{- "# Tools\n\n" }}
209
+ {%- set available_builtin_tools = namespace(browser=false, python=false) %}
210
+ {%- for tool in builtin_tools %}
211
+ {%- if tool == "browser" %}
212
+ {%- set available_builtin_tools.browser = true %}
213
+ {%- elif tool == "python" %}
214
+ {%- set available_builtin_tools.python = true %}
215
+ {%- endif %}
216
+ {%- endfor %}
217
+ {{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
218
+ {%- endif -%}
219
+ {{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
220
+ {%- if tools -%}
221
+ {{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
222
+ {%- endif -%}
223
+ {%- endmacro -%}
224
+
225
+ {#- Main Template Logic ================================================= #}
226
+ {#- Set defaults #}
227
+
228
+ {#- Render system message #}
229
+ {{- "<|start|>system<|message|>" }}
230
+ {{- build_system_message() }}
231
+ {{- "<|end|>" }}
232
+
233
+ {#- Extract developer message #}
234
+ {%- if messages[0].role == "developer" or messages[0].role == "system" %}
235
+ {%- set developer_message = messages[0].content %}
236
+ {%- set loop_messages = messages[1:] %}
237
+ {%- else %}
238
+ {%- set developer_message = "" %}
239
+ {%- set loop_messages = messages %}
240
+ {%- endif %}
241
+
242
+ {#- Render developer message #}
243
+ {%- if developer_message or tools %}
244
+ {{- "<|start|>developer<|message|>" }}
245
+ {%- if developer_message %}
246
+ {{- "# Instructions\n\n" }}
247
+ {{- developer_message }}
248
+ {{- "\n\n" }}
249
+ {%- endif %}
250
+ {%- if tools -%}
251
+ {{- "# Tools\n\n" }}
252
+ {{- render_tool_namespace("functions", tools) }}
253
+ {%- endif -%}
254
+ {{- "<|end|>" }}
255
+ {%- endif %}
256
+
257
+ {#- Render messages #}
258
+ {%- set last_tool_call = namespace(name=none) %}
259
+ {%- for message in loop_messages -%}
260
+ {#- At this point only assistant/user/tool messages should remain #}
261
+ {%- if message.role == 'assistant' -%}
262
+ {#- Checks to ensure the messages are being passed in the format we expect #}
263
+ {%- if "content" in message %}
264
+ {%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
265
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
266
+ {%- endif %}
267
+ {%- endif %}
268
+ {%- if "thinking" in message %}
269
+ {%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
270
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
271
+ {%- endif %}
272
+ {%- endif %}
273
+ {%- if "tool_calls" in message %}
274
+ {#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
275
+ {#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
276
+ {#- when we render CoT/analysis messages in inference. #}
277
+ {%- set future_final_message = namespace(found=false) %}
278
+ {%- for future_message in loop_messages[loop.index:] %}
279
+ {%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
280
+ {%- set future_final_message.found = true %}
281
+ {%- endif %}
282
+ {%- endfor %}
283
+ {#- We assume max 1 tool call per message, and so we infer the tool call name #}
284
+ {#- in "tool" messages from the most recent assistant tool call name #}
285
+ {%- set tool_call = message.tool_calls[0] %}
286
+ {%- if tool_call.function %}
287
+ {%- set tool_call = tool_call.function %}
288
+ {%- endif %}
289
+ {%- if message.content and message.thinking %}
290
+ {{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
291
+ {%- elif message.content and not future_final_message.found %}
292
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
293
+ {%- elif message.thinking and not future_final_message.found %}
294
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
295
+ {%- endif %}
296
+ {{- "<|start|>assistant to=" }}
297
+ {{- "functions." + tool_call.name + "<|channel|>commentary " }}
298
+ {{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
299
+ {{- tool_call.arguments|tojson }}
300
+ {{- "<|call|>" }}
301
+ {%- set last_tool_call.name = tool_call.name %}
302
+ {%- elif loop.last and not add_generation_prompt %}
303
+ {#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
304
+ {#- This is a situation that should only occur in training, never in inference. #}
305
+ {%- if "thinking" in message %}
306
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
307
+ {%- endif %}
308
+ {#- <|return|> indicates the end of generation, but <|end|> does not #}
309
+ {#- <|return|> should never be an input to the model, but we include it as the final token #}
310
+ {#- when training, so the model learns to emit it. #}
311
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
312
+ {%- else %}
313
+ {#- CoT is dropped during all previous turns, so we never render it for inference #}
314
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
315
+ {%- set last_tool_call.name = none %}
316
+ {%- endif %}
317
+ {%- elif message.role == 'tool' -%}
318
+ {%- if last_tool_call.name is none %}
319
+ {{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
320
+ {%- endif %}
321
+ {{- "<|start|>functions." + last_tool_call.name }}
322
+ {{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
323
+ {%- elif message.role == 'user' -%}
324
+ {{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
325
+ {%- endif -%}
326
+ {%- endfor -%}
327
+
328
+ {#- Generation prompt #}
329
+ {%- if add_generation_prompt -%}
330
+ <|start|>assistant
331
+ {%- endif -%}
checkpoint-1642/README.md ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: openai/gpt-oss-20b
3
+ library_name: peft
4
+ tags:
5
+ - base_model:adapter:openai/gpt-oss-20b
6
+ - lora
7
+ - sft
8
+ - transformers
9
+ - trl
10
+ ---
11
+
12
+ # Model Card for Model ID
13
+
14
+ <!-- Provide a quick summary of what the model is/does. -->
15
+
16
+
17
+
18
+ ## Model Details
19
+
20
+ ### Model Description
21
+
22
+ <!-- Provide a longer summary of what this model is. -->
23
+
24
+
25
+
26
+ - **Developed by:** [More Information Needed]
27
+ - **Funded by [optional]:** [More Information Needed]
28
+ - **Shared by [optional]:** [More Information Needed]
29
+ - **Model type:** [More Information Needed]
30
+ - **Language(s) (NLP):** [More Information Needed]
31
+ - **License:** [More Information Needed]
32
+ - **Finetuned from model [optional]:** [More Information Needed]
33
+
34
+ ### Model Sources [optional]
35
+
36
+ <!-- Provide the basic links for the model. -->
37
+
38
+ - **Repository:** [More Information Needed]
39
+ - **Paper [optional]:** [More Information Needed]
40
+ - **Demo [optional]:** [More Information Needed]
41
+
42
+ ## Uses
43
+
44
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
45
+
46
+ ### Direct Use
47
+
48
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Downstream Use [optional]
53
+
54
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
55
+
56
+ [More Information Needed]
57
+
58
+ ### Out-of-Scope Use
59
+
60
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ## Bias, Risks, and Limitations
65
+
66
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
67
+
68
+ [More Information Needed]
69
+
70
+ ### Recommendations
71
+
72
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
73
+
74
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
75
+
76
+ ## How to Get Started with the Model
77
+
78
+ Use the code below to get started with the model.
79
+
80
+ [More Information Needed]
81
+
82
+ ## Training Details
83
+
84
+ ### Training Data
85
+
86
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
87
+
88
+ [More Information Needed]
89
+
90
+ ### Training Procedure
91
+
92
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
93
+
94
+ #### Preprocessing [optional]
95
+
96
+ [More Information Needed]
97
+
98
+
99
+ #### Training Hyperparameters
100
+
101
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
102
+
103
+ #### Speeds, Sizes, Times [optional]
104
+
105
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
106
+
107
+ [More Information Needed]
108
+
109
+ ## Evaluation
110
+
111
+ <!-- This section describes the evaluation protocols and provides the results. -->
112
+
113
+ ### Testing Data, Factors & Metrics
114
+
115
+ #### Testing Data
116
+
117
+ <!-- This should link to a Dataset Card if possible. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Factors
122
+
123
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
124
+
125
+ [More Information Needed]
126
+
127
+ #### Metrics
128
+
129
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
130
+
131
+ [More Information Needed]
132
+
133
+ ### Results
134
+
135
+ [More Information Needed]
136
+
137
+ #### Summary
138
+
139
+
140
+
141
+ ## Model Examination [optional]
142
+
143
+ <!-- Relevant interpretability work for the model goes here -->
144
+
145
+ [More Information Needed]
146
+
147
+ ## Environmental Impact
148
+
149
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
150
+
151
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
152
+
153
+ - **Hardware Type:** [More Information Needed]
154
+ - **Hours used:** [More Information Needed]
155
+ - **Cloud Provider:** [More Information Needed]
156
+ - **Compute Region:** [More Information Needed]
157
+ - **Carbon Emitted:** [More Information Needed]
158
+
159
+ ## Technical Specifications [optional]
160
+
161
+ ### Model Architecture and Objective
162
+
163
+ [More Information Needed]
164
+
165
+ ### Compute Infrastructure
166
+
167
+ [More Information Needed]
168
+
169
+ #### Hardware
170
+
171
+ [More Information Needed]
172
+
173
+ #### Software
174
+
175
+ [More Information Needed]
176
+
177
+ ## Citation [optional]
178
+
179
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
180
+
181
+ **BibTeX:**
182
+
183
+ [More Information Needed]
184
+
185
+ **APA:**
186
+
187
+ [More Information Needed]
188
+
189
+ ## Glossary [optional]
190
+
191
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
192
+
193
+ [More Information Needed]
194
+
195
+ ## More Information [optional]
196
+
197
+ [More Information Needed]
198
+
199
+ ## Model Card Authors [optional]
200
+
201
+ [More Information Needed]
202
+
203
+ ## Model Card Contact
204
+
205
+ [More Information Needed]
206
+ ### Framework versions
207
+
208
+ - PEFT 0.17.1
checkpoint-1642/adapter_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "GptOssForCausalLM",
5
+ "parent_library": "transformers.models.gpt_oss.modeling_gpt_oss"
6
+ },
7
+ "base_model_name_or_path": "openai/gpt-oss-20b",
8
+ "bias": "none",
9
+ "corda_config": null,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 16,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.0,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "qalora_group_size": 16,
27
+ "r": 8,
28
+ "rank_pattern": {},
29
+ "revision": null,
30
+ "target_modules": [
31
+ "o_proj",
32
+ "k_proj",
33
+ "v_proj",
34
+ "q_proj"
35
+ ],
36
+ "target_parameters": [
37
+ "7.mlp.experts.gate_up_proj",
38
+ "7.mlp.experts.down_proj",
39
+ "15.mlp.experts.gate_up_proj",
40
+ "15.mlp.experts.down_proj",
41
+ "23.mlp.experts.gate_up_proj",
42
+ "23.mlp.experts.down_proj"
43
+ ],
44
+ "task_type": null,
45
+ "trainable_token_indices": null,
46
+ "use_dora": false,
47
+ "use_qalora": false,
48
+ "use_rslora": false
49
+ }
checkpoint-1642/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a2bb30c52c7bdb0a748ad8bac39bd5ca2c2eea8c78a335188ddff323f2fbdd4
3
+ size 2366470368
checkpoint-1642/chat_template.jinja ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#-
2
+ In addition to the normal inputs of `messages` and `tools`, this template also accepts the
3
+ following kwargs:
4
+ - "builtin_tools": A list, can contain "browser" and/or "python".
5
+ - "model_identity": A string that optionally describes the model identity.
6
+ - "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
7
+ #}
8
+
9
+ {#- Tool Definition Rendering ============================================== #}
10
+ {%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}{#- Renders one JSON-schema fragment (param_spec) as a TypeScript-style type string, recursing into array items, oneOf variants and object properties. required_params is only forwarded to recursive calls and is_nullable is never read in this body. #}
11
+ {%- if param_spec.type == "array" -%}
12
+ {%- if param_spec['items'] -%}
13
+ {%- if param_spec['items']['type'] == "string" -%}
14
+ {{- "string[]" }}
15
+ {%- elif param_spec['items']['type'] == "number" -%}
16
+ {{- "number[]" }}
17
+ {%- elif param_spec['items']['type'] == "integer" -%}
18
+ {{- "number[]" }}
19
+ {%- elif param_spec['items']['type'] == "boolean" -%}
20
+ {{- "boolean[]" }}
21
+ {%- else -%}
22
+ {%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
23
+ {%- if inner_type == "object | object" or inner_type|length > 50 -%}
24
+ {{- "any[]" }}
25
+ {%- else -%}
26
+ {{- inner_type + "[]" }}
27
+ {%- endif -%}
28
+ {%- endif -%}
29
+ {%- if param_spec.nullable -%}
30
+ {{- " | null" }}
31
+ {%- endif -%}
32
+ {%- else -%}
33
+ {{- "any[]" }}
34
+ {%- if param_spec.nullable -%}
35
+ {{- " | null" }}
36
+ {%- endif -%}
37
+ {%- endif -%}
38
+ {%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
39
+ {#- Handle array of types like ["object", "object"] from Union[dict, list] #}
40
+ {%- if param_spec.type | length > 1 -%}
41
+ {{- param_spec.type | join(" | ") }}
42
+ {%- else -%}
43
+ {{- param_spec.type[0] }}
44
+ {%- endif -%}
45
+ {%- elif param_spec.oneOf -%}
46
+ {#- Handle oneOf schemas - check for complex unions and fallback to any. The flag is kept in a namespace() object because a plain set inside the for loop is not visible once the loop ends. #}
47
+ {%- set oneof_state = namespace(has_object_variants=false) -%}
48
+ {%- for variant in param_spec.oneOf -%}
49
+ {%- if variant.type == "object" -%}
50
+ {%- set oneof_state.has_object_variants = true -%}
51
+ {%- endif -%}
52
+ {%- endfor -%}
53
+ {%- if oneof_state.has_object_variants and param_spec.oneOf|length > 1 -%}
54
+ {{- "any" }}
55
+ {%- else -%}
56
+ {%- for variant in param_spec.oneOf -%}
57
+ {{- render_typescript_type(variant, required_params) -}}
58
+ {%- if variant.description %}
59
+ {{- "// " + variant.description }}
60
+ {%- endif -%}
61
+ {%- if variant.default is defined %}
62
+ {{ "// default: " + variant.default|tojson }}
63
+ {%- endif -%}
64
+ {%- if not loop.last %}
65
+ {{- " | " }}
66
+ {% endif -%}
67
+ {%- endfor -%}
68
+ {%- endif -%}
69
+ {%- elif param_spec.type == "string" -%}
70
+ {%- if param_spec.enum -%}
71
+ {{- '"' + param_spec.enum|join('" | "') + '"' -}}
72
+ {%- else -%}
73
+ {{- "string" }}
74
+ {%- if param_spec.nullable %}
75
+ {{- " | null" }}
76
+ {%- endif -%}
77
+ {%- endif -%}
78
+ {%- elif param_spec.type == "number" -%}
79
+ {{- "number" }}
80
+ {%- elif param_spec.type == "integer" -%}
81
+ {{- "number" }}
82
+ {%- elif param_spec.type == "boolean" -%}
83
+ {{- "boolean" }}
84
+
85
+ {%- elif param_spec.type == "object" -%}
86
+ {%- if param_spec.properties -%}
87
+ {{- "{\n" }}
88
+ {%- for prop_name, prop_spec in param_spec.properties.items() -%}
89
+ {{- prop_name -}}
90
+ {%- if prop_name not in (param_spec.required or []) -%}
91
+ {{- "?" }}
92
+ {%- endif -%}
93
+ {{- ": " }}
94
+ {{ render_typescript_type(prop_spec, param_spec.required or []) }}
95
+ {%- if not loop.last -%}
96
+ {{-", " }}
97
+ {%- endif -%}
98
+ {%- endfor -%}
99
+ {{- "}" }}
100
+ {%- else -%}
101
+ {{- "object" }}
102
+ {%- endif -%}
103
+ {%- else -%}
104
+ {{- "any" }}
105
+ {%- endif -%}
106
+ {%- endmacro -%}
107
+
108
+ {%- macro render_tool_namespace(namespace_name, tools) -%}{#- Renders every entry of tools as a TypeScript-style "type NAME = (_: {...}) => any;" declaration wrapped in "namespace <namespace_name> { ... }". Each entry is unwrapped through its .function attribute. #}
109
+ {{- "## " + namespace_name + "\n\n" }}
110
+ {{- "namespace " + namespace_name + " {\n\n" }}
111
+ {%- for tool in tools %}
112
+ {%- set tool = tool.function %}
113
+ {{- "// " + (tool.description or "") + "\n" }}{#- a missing or null description renders as an empty comment instead of raising on the concatenation #}
114
+ {{- "type "+ tool.name + " = " }}
115
+ {%- if tool.parameters and tool.parameters.properties %}
116
+ {{- "(_: {\n" }}
117
+ {%- for param_name, param_spec in tool.parameters.properties.items() %}
118
+ {%- if param_spec.description %}
119
+ {{- "// " + param_spec.description + "\n" }}
120
+ {%- endif %}
121
+ {{- param_name }}
122
+ {%- if param_name not in (tool.parameters.required or []) -%}
123
+ {{- "?" }}
124
+ {%- endif -%}
125
+ {{- ": " }}
126
+ {{- render_typescript_type(param_spec, tool.parameters.required or []) }}
127
+ {%- if param_spec.default is defined -%}{#- enum and oneOf defaults are printed unquoted; the string filter keeps numeric or boolean defaults from breaking the concatenation #}
128
+ {%- if param_spec.enum %}
129
+ {{- ", // default: " + param_spec.default|string }}
130
+ {%- elif param_spec.oneOf %}
131
+ {{- "// default: " + param_spec.default|string }}
132
+ {%- else %}
133
+ {{- ", // default: " + param_spec.default|tojson }}
134
+ {%- endif -%}
135
+ {%- endif -%}
136
+ {%- if not loop.last %}{#- both branches emit the same text, so every parameter line ends with a trailing comma #}
137
+ {{- ",\n" }}
138
+ {%- else %}
139
+ {{- ",\n" }}
140
+ {%- endif -%}
141
+ {%- endfor %}
142
+ {{- "}) => any;\n\n" }}
143
+ {%- else -%}
144
+ {{- "() => any;\n\n" }}
145
+ {%- endif -%}
146
+ {%- endfor %}
147
+ {{- "} // namespace " + namespace_name }}
148
+ {%- endmacro -%}
149
+
150
+ {%- macro render_builtin_tools(browser_tool, python_tool) -%}{#- Emits the fixed prompt text for the built-in tools: the "browser" namespace (search, open, find) when browser_tool is truthy, then the "python" section when python_tool is truthy. Emits nothing when both are falsy. #}
151
+ {%- if browser_tool %}
152
+ {{- "## browser\n\n" }}
153
+ {{- "// Tool for browsing.\n" }}
154
+ {{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
155
+ {{- "// Cite information from the tool using the following format:\n" }}
156
+ {{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
157
+ {{- "// Do not quote more than 10 words directly from the tool output.\n" }}
158
+ {{- "// sources=web (default: web)\n" }}
159
+ {{- "namespace browser {\n\n" }}
160
+ {{- "// Searches for information related to `query` and displays `topn` results.\n" }}
161
+ {{- "type search = (_: {\n" }}
162
+ {{- "query: string,\n" }}
163
+ {{- "topn?: number, // default: 10\n" }}
164
+ {{- "source?: string,\n" }}
165
+ {{- "}) => any;\n\n" }}
166
+ {{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
167
+ {{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
168
+ {{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
169
+ {{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
170
+ {{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
171
+ {{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
172
+ {{- "type open = (_: {\n" }}
173
+ {{- "id?: number | string, // default: -1\n" }}
174
+ {{- "cursor?: number, // default: -1\n" }}
175
+ {{- "loc?: number, // default: -1\n" }}
176
+ {{- "num_lines?: number, // default: -1\n" }}
177
+ {{- "view_source?: boolean, // default: false\n" }}
178
+ {{- "source?: string,\n" }}
179
+ {{- "}) => any;\n\n" }}
180
+ {{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
181
+ {{- "type find = (_: {\n" }}
182
+ {{- "pattern: string,\n" }}
183
+ {{- "cursor?: number, // default: -1\n" }}
184
+ {{- "}) => any;\n\n" }}
185
+ {{- "} // namespace browser\n\n" }}
186
+ {%- endif -%}
187
+
188
+ {%- if python_tool %}{#- The python section is plain prose; unlike the browser section it declares no namespace or type signatures. #}
189
+ {{- "## python\n\n" }}
190
+ {{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
191
+ {{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
192
+ {%- endif -%}
193
+ {%- endmacro -%}
194
+
195
+ {#- System Message Construction ============================================ #}
196
+ {%- macro build_system_message() -%}{#- Builds the body of the system message: model identity, knowledge cutoff, current date, reasoning effort, the optional built-in tools section and the channel rules. Reads model_identity, reasoning_effort, builtin_tools and tools from the render context rather than from macro arguments. #}
197
+ {%- if model_identity is not defined %}
198
+ {%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
199
+ {%- endif %}
200
+ {{- model_identity + "\n" }}
201
+ {{- "Knowledge cutoff: 2024-06\n" }}
202
+ {{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}{#- NOTE(review): strftime_now is not defined in this template; presumably supplied by the rendering environment - confirm #}
203
+ {%- if reasoning_effort is not defined %}
204
+ {%- set reasoning_effort = "medium" %}
205
+ {%- endif %}
206
+ {{- "Reasoning: " + reasoning_effort + "\n\n" }}
207
+ {%- if builtin_tools %}
208
+ {{- "# Tools\n\n" }}
209
+ {%- set available_builtin_tools = namespace(browser=false, python=false) %}{#- namespace object so the flags set inside the loop below are still visible after it #}
210
+ {%- for tool in builtin_tools %}
211
+ {%- if tool == "browser" %}
212
+ {%- set available_builtin_tools.browser = true %}
213
+ {%- elif tool == "python" %}
214
+ {%- set available_builtin_tools.python = true %}
215
+ {%- endif %}
216
+ {%- endfor %}
217
+ {{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
218
+ {%- endif -%}
219
+ {{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
220
+ {%- if tools -%}
221
+ {{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
222
+ {%- endif -%}
223
+ {%- endmacro -%}
224
+
225
+ {#- Main Template Logic ================================================= #}
226
+ {#- Set defaults #}
227
+
228
+ {#- Render system message: always emitted, with its body produced by build_system_message() #}
229
+ {{- "<|start|>system<|message|>" }}
230
+ {{- build_system_message() }}
231
+ {{- "<|end|>" }}
232
+
233
+ {#- Extract developer message: a leading "developer" or "system" message is lifted out as the developer instructions and removed from the loop. The "messages and" guard keeps an empty conversation from raising on messages[0]. #}
234
+ {%- if messages and (messages[0].role == "developer" or messages[0].role == "system") %}
235
+ {%- set developer_message = messages[0].content %}
236
+ {%- set loop_messages = messages[1:] %}
237
+ {%- else %}
238
+ {%- set developer_message = "" %}
239
+ {%- set loop_messages = messages %}
240
+ {%- endif %}
241
+
242
+ {#- Render developer message: emitted only when there are instructions and/or function tools to describe #}
243
+ {%- if developer_message or tools %}
244
+ {{- "<|start|>developer<|message|>" }}
245
+ {%- if developer_message %}
246
+ {{- "# Instructions\n\n" }}
247
+ {{- developer_message }}
248
+ {{- "\n\n" }}
249
+ {%- endif %}
250
+ {%- if tools -%}
251
+ {{- "# Tools\n\n" }}
252
+ {{- render_tool_namespace("functions", tools) }}
253
+ {%- endif -%}
254
+ {{- "<|end|>" }}
255
+ {%- endif %}
256
+
257
+ {#- Render messages: walk loop_messages in order, emitting assistant turns (tool calls or final answers), tool results and user turns. last_tool_call remembers the most recent tool-call name so a following "tool" message can be attributed to it. #}
258
+ {%- set last_tool_call = namespace(name=none) %}
259
+ {%- for message in loop_messages -%}
260
+ {#- At this point only assistant/user/tool messages should remain; any other role matches no branch of the if/elif chain below and renders nothing #}
261
+ {%- if message.role == 'assistant' -%}
262
+ {#- Checks to ensure the messages are being passed in the format we expect #}
263
+ {%- if "content" in message %}
264
+ {%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
265
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
266
+ {%- endif %}
267
+ {%- endif %}
268
+ {%- if "thinking" in message %}
269
+ {%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
270
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
271
+ {%- endif %}
272
+ {%- endif %}
273
+ {%- if "tool_calls" in message %}
274
+ {#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
275
+ {#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
276
+ {#- when we render CoT/analysis messages in inference. #}
277
+ {%- set future_final_message = namespace(found=false) %}{#- namespace object so the inner loop can flip the flag; the slice below starts at loop.index, i.e. at the message after the current one #}
278
+ {%- for future_message in loop_messages[loop.index:] %}
279
+ {%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
280
+ {%- set future_final_message.found = true %}
281
+ {%- endif %}
282
+ {%- endfor %}
283
+ {#- We assume max 1 tool call per message, and so we infer the tool call name #}
284
+ {#- in "tool" messages from the most recent assistant tool call name #}
285
+ {%- set tool_call = message.tool_calls[0] %}
286
+ {%- if tool_call.function %}
287
+ {%- set tool_call = tool_call.function %}
288
+ {%- endif %}
289
+ {%- if message.content and message.thinking %}
290
+ {{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
291
+ {%- elif message.content and not future_final_message.found %}
292
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
293
+ {%- elif message.thinking and not future_final_message.found %}
294
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
295
+ {%- endif %}
296
+ {{- "<|start|>assistant to=" }}
297
+ {{- "functions." + tool_call.name + "<|channel|>commentary " }}
298
+ {{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
299
+ {{- tool_call.arguments|tojson }}
300
+ {{- "<|call|>" }}
301
+ {%- set last_tool_call.name = tool_call.name %}
302
+ {%- elif loop.last and not add_generation_prompt %}
303
+ {#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
304
+ {#- This is a situation that should only occur in training, never in inference. #}
305
+ {%- if "thinking" in message %}
306
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
307
+ {%- endif %}
308
+ {#- <|return|> indicates the end of generation, but <|end|> does not #}
309
+ {#- <|return|> should never be an input to the model, but we include it as the final token #}
310
+ {#- when training, so the model learns to emit it. #}
311
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
312
+ {%- else %}
313
+ {#- CoT is dropped during all previous turns, so we never render it for inference #}
314
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
315
+ {%- set last_tool_call.name = none %}
316
+ {%- endif %}
317
+ {%- elif message.role == 'tool' -%}{#- tool results are attributed to the last recorded tool-call name and their content is JSON-encoded via tojson #}
318
+ {%- if last_tool_call.name is none %}
319
+ {{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
320
+ {%- endif %}
321
+ {{- "<|start|>functions." + last_tool_call.name }}
322
+ {{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
323
+ {%- elif message.role == 'user' -%}
324
+ {{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
325
+ {%- endif -%}
326
+ {%- endfor -%}
327
+
328
+ {#- Generation prompt: when add_generation_prompt is truthy, open an assistant turn (no channel, no message marker) for the model to continue #}
329
+ {%- if add_generation_prompt -%}
330
+ <|start|>assistant
331
+ {%- endif -%}
checkpoint-1642/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa8c076a2c7a54274c3e6fea5b408ff597f64186f832c0921c0fc4ac90a90646
3
+ size 120495883
checkpoint-1642/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8f92cf63e0989759370d24108b469c492c12202403f036015307ce49f12cedc
3
+ size 16389
checkpoint-1642/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ed40a0a4e9f365d2c6cc004d97e6705894eba46c8be4c160c1455bc3062dee1
3
+ size 16389
checkpoint-1642/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d688b304d19c260b5cfa471535ed51d7e1d60b3a0d0159dfd1a04b87904a9f42
3
+ size 16389
checkpoint-1642/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9967425ebcaee80d9b518fa0244d52f739b1b983d87cda71d5fede0c073e9d3b
3
+ size 16389
checkpoint-1642/rng_state_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:469900fd39c667ffbd49c3c407c0ba317a1e9f5f9339a99b5d38423b7d0ce6d4
3
+ size 16389
checkpoint-1642/rng_state_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:124688471ff2a6e80f2fcefedbf741fb18d08dd539d5bd07a52e81be545142a5
3
+ size 16389
checkpoint-1642/rng_state_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e69f1ced9f992a72c948698e5eb06088610788988cdb2fdbdd624e064319d60
3
+ size 16389
checkpoint-1642/rng_state_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a376268a55d6ee10c371c06aa952334c4c6a1af9ea2d71b1951a57367a0c6722
3
+ size 16389
checkpoint-1642/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dc6cc730a04732028e5e99bd0647de7bc952d3bd8bafab1e763ff61ef93625d
3
+ size 1465
checkpoint-1642/special_tokens_map.json ADDED
@@ -0,0 +1,1817 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "AAD",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ {
11
+ "content": "AArch64",
12
+ "lstrip": false,
13
+ "normalized": false,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ {
18
+ "content": "ACL",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ {
25
+ "content": "AD",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ },
31
+ {
32
+ "content": "AES",
33
+ "lstrip": false,
34
+ "normalized": false,
35
+ "rstrip": false,
36
+ "single_word": false
37
+ },
38
+ {
39
+ "content": "AES256GCM",
40
+ "lstrip": false,
41
+ "normalized": false,
42
+ "rstrip": false,
43
+ "single_word": false
44
+ },
45
+ {
46
+ "content": "AESCBC",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false
51
+ },
52
+ {
53
+ "content": "AKE",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false
58
+ },
59
+ {
60
+ "content": "AON",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false
65
+ },
66
+ {
67
+ "content": "ASID",
68
+ "lstrip": false,
69
+ "normalized": false,
70
+ "rstrip": false,
71
+ "single_word": false
72
+ },
73
+ {
74
+ "content": "AXI",
75
+ "lstrip": false,
76
+ "normalized": false,
77
+ "rstrip": false,
78
+ "single_word": false
79
+ },
80
+ {
81
+ "content": "Acronym",
82
+ "lstrip": false,
83
+ "normalized": false,
84
+ "rstrip": false,
85
+ "single_word": false
86
+ },
87
+ {
88
+ "content": "AoU",
89
+ "lstrip": false,
90
+ "normalized": false,
91
+ "rstrip": false,
92
+ "single_word": false
93
+ },
94
+ {
95
+ "content": "AutoSar",
96
+ "lstrip": false,
97
+ "normalized": false,
98
+ "rstrip": false,
99
+ "single_word": false
100
+ },
101
+ {
102
+ "content": "BAM",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false
107
+ },
108
+ {
109
+ "content": "BCH",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false
114
+ },
115
+ {
116
+ "content": "BIST",
117
+ "lstrip": false,
118
+ "normalized": false,
119
+ "rstrip": false,
120
+ "single_word": false
121
+ },
122
+ {
123
+ "content": "BOM",
124
+ "lstrip": false,
125
+ "normalized": false,
126
+ "rstrip": false,
127
+ "single_word": false
128
+ },
129
+ {
130
+ "content": "BPMP",
131
+ "lstrip": false,
132
+ "normalized": false,
133
+ "rstrip": false,
134
+ "single_word": false
135
+ },
136
+ {
137
+ "content": "BPS",
138
+ "lstrip": false,
139
+ "normalized": false,
140
+ "rstrip": false,
141
+ "single_word": false
142
+ },
143
+ {
144
+ "content": "BPU",
145
+ "lstrip": false,
146
+ "normalized": false,
147
+ "rstrip": false,
148
+ "single_word": false
149
+ },
150
+ {
151
+ "content": "BRBCT",
152
+ "lstrip": false,
153
+ "normalized": false,
154
+ "rstrip": false,
155
+ "single_word": false
156
+ },
157
+ {
158
+ "content": "BW",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false
163
+ },
164
+ {
165
+ "content": "C2C",
166
+ "lstrip": false,
167
+ "normalized": false,
168
+ "rstrip": false,
169
+ "single_word": false
170
+ },
171
+ {
172
+ "content": "CA",
173
+ "lstrip": false,
174
+ "normalized": false,
175
+ "rstrip": false,
176
+ "single_word": false
177
+ },
178
+ {
179
+ "content": "CAN",
180
+ "lstrip": false,
181
+ "normalized": false,
182
+ "rstrip": false,
183
+ "single_word": false
184
+ },
185
+ {
186
+ "content": "CANFD",
187
+ "lstrip": false,
188
+ "normalized": false,
189
+ "rstrip": false,
190
+ "single_word": false
191
+ },
192
+ {
193
+ "content": "CAR",
194
+ "lstrip": false,
195
+ "normalized": false,
196
+ "rstrip": false,
197
+ "single_word": false
198
+ },
199
+ {
200
+ "content": "CAVP",
201
+ "lstrip": false,
202
+ "normalized": false,
203
+ "rstrip": false,
204
+ "single_word": false
205
+ },
206
+ {
207
+ "content": "CBB",
208
+ "lstrip": false,
209
+ "normalized": false,
210
+ "rstrip": false,
211
+ "single_word": false
212
+ },
213
+ {
214
+ "content": "CBC",
215
+ "lstrip": false,
216
+ "normalized": false,
217
+ "rstrip": false,
218
+ "single_word": false
219
+ },
220
+ {
221
+ "content": "CBR",
222
+ "lstrip": false,
223
+ "normalized": false,
224
+ "rstrip": false,
225
+ "single_word": false
226
+ },
227
+ {
228
+ "content": "CCM",
229
+ "lstrip": false,
230
+ "normalized": false,
231
+ "rstrip": false,
232
+ "single_word": false
233
+ },
234
+ {
235
+ "content": "CCPLEX",
236
+ "lstrip": false,
237
+ "normalized": false,
238
+ "rstrip": false,
239
+ "single_word": false
240
+ },
241
+ {
242
+ "content": "CCPLEX_L2",
243
+ "lstrip": false,
244
+ "normalized": false,
245
+ "rstrip": false,
246
+ "single_word": false
247
+ },
248
+ {
249
+ "content": "CCPLEX_MISC",
250
+ "lstrip": false,
251
+ "normalized": false,
252
+ "rstrip": false,
253
+ "single_word": false
254
+ },
255
+ {
256
+ "content": "CCPLEX_SCF",
257
+ "lstrip": false,
258
+ "normalized": false,
259
+ "rstrip": false,
260
+ "single_word": false
261
+ },
262
+ {
263
+ "content": "CDD",
264
+ "lstrip": false,
265
+ "normalized": false,
266
+ "rstrip": false,
267
+ "single_word": false
268
+ },
269
+ {
270
+ "content": "CIF",
271
+ "lstrip": false,
272
+ "normalized": false,
273
+ "rstrip": false,
274
+ "single_word": false
275
+ },
276
+ {
277
+ "content": "CMAC",
278
+ "lstrip": false,
279
+ "normalized": false,
280
+ "rstrip": false,
281
+ "single_word": false
282
+ },
283
+ {
284
+ "content": "CPE",
285
+ "lstrip": false,
286
+ "normalized": false,
287
+ "rstrip": false,
288
+ "single_word": false
289
+ },
290
+ {
291
+ "content": "CPU",
292
+ "lstrip": false,
293
+ "normalized": false,
294
+ "rstrip": false,
295
+ "single_word": false
296
+ },
297
+ {
298
+ "content": "CRC",
299
+ "lstrip": false,
300
+ "normalized": false,
301
+ "rstrip": false,
302
+ "single_word": false
303
+ },
304
+ {
305
+ "content": "CSI",
306
+ "lstrip": false,
307
+ "normalized": false,
308
+ "rstrip": false,
309
+ "single_word": false
310
+ },
311
+ {
312
+ "content": "CSP",
313
+ "lstrip": false,
314
+ "normalized": false,
315
+ "rstrip": false,
316
+ "single_word": false
317
+ },
318
+ {
319
+ "content": "CTR",
320
+ "lstrip": false,
321
+ "normalized": false,
322
+ "rstrip": false,
323
+ "single_word": false
324
+ },
325
+ {
326
+ "content": "CTXT",
327
+ "lstrip": false,
328
+ "normalized": false,
329
+ "rstrip": false,
330
+ "single_word": false
331
+ },
332
+ {
333
+ "content": "CV",
334
+ "lstrip": false,
335
+ "normalized": false,
336
+ "rstrip": false,
337
+ "single_word": false
338
+ },
339
+ {
340
+ "content": "DBB",
341
+ "lstrip": false,
342
+ "normalized": false,
343
+ "rstrip": false,
344
+ "single_word": false
345
+ },
346
+ {
347
+ "content": "DEP",
348
+ "lstrip": false,
349
+ "normalized": false,
350
+ "rstrip": false,
351
+ "single_word": false
352
+ },
353
+ {
354
+ "content": "DEV",
355
+ "lstrip": false,
356
+ "normalized": false,
357
+ "rstrip": false,
358
+ "single_word": false
359
+ },
360
+ {
361
+ "content": "DFA",
362
+ "lstrip": false,
363
+ "normalized": false,
364
+ "rstrip": false,
365
+ "single_word": false
366
+ },
367
+ {
368
+ "content": "DFT",
369
+ "lstrip": false,
370
+ "normalized": false,
371
+ "rstrip": false,
372
+ "single_word": false
373
+ },
374
+ {
375
+ "content": "DIP",
376
+ "lstrip": false,
377
+ "normalized": false,
378
+ "rstrip": false,
379
+ "single_word": false
380
+ },
381
+ {
382
+ "content": "DISPLAY",
383
+ "lstrip": false,
384
+ "normalized": false,
385
+ "rstrip": false,
386
+ "single_word": false
387
+ },
388
+ {
389
+ "content": "DLA",
390
+ "lstrip": false,
391
+ "normalized": false,
392
+ "rstrip": false,
393
+ "single_word": false
394
+ },
395
+ {
396
+ "content": "DMA",
397
+ "lstrip": false,
398
+ "normalized": false,
399
+ "rstrip": false,
400
+ "single_word": false
401
+ },
402
+ {
403
+ "content": "DMEM",
404
+ "lstrip": false,
405
+ "normalized": false,
406
+ "rstrip": false,
407
+ "single_word": false
408
+ },
409
+ {
410
+ "content": "DPA",
411
+ "lstrip": false,
412
+ "normalized": false,
413
+ "rstrip": false,
414
+ "single_word": false
415
+ },
416
+ {
417
+ "content": "DSC",
418
+ "lstrip": false,
419
+ "normalized": false,
420
+ "rstrip": false,
421
+ "single_word": false
422
+ },
423
+ {
424
+ "content": "DT",
425
+ "lstrip": false,
426
+ "normalized": false,
427
+ "rstrip": false,
428
+ "single_word": false
429
+ },
430
+ {
431
+ "content": "DU",
432
+ "lstrip": false,
433
+ "normalized": false,
434
+ "rstrip": false,
435
+ "single_word": false
436
+ },
437
+ {
438
+ "content": "DVMU",
439
+ "lstrip": false,
440
+ "normalized": false,
441
+ "rstrip": false,
442
+ "single_word": false
443
+ },
444
+ {
445
+ "content": "EC",
446
+ "lstrip": false,
447
+ "normalized": false,
448
+ "rstrip": false,
449
+ "single_word": false
450
+ },
451
+ {
452
+ "content": "ECB",
453
+ "lstrip": false,
454
+ "normalized": false,
455
+ "rstrip": false,
456
+ "single_word": false
457
+ },
458
+ {
459
+ "content": "ECC",
460
+ "lstrip": false,
461
+ "normalized": false,
462
+ "rstrip": false,
463
+ "single_word": false
464
+ },
465
+ {
466
+ "content": "ECDHE",
467
+ "lstrip": false,
468
+ "normalized": false,
469
+ "rstrip": false,
470
+ "single_word": false
471
+ },
472
+ {
473
+ "content": "ECDSA",
474
+ "lstrip": false,
475
+ "normalized": false,
476
+ "rstrip": false,
477
+ "single_word": false
478
+ },
479
+ {
480
+ "content": "ECID",
481
+ "lstrip": false,
482
+ "normalized": false,
483
+ "rstrip": false,
484
+ "single_word": false
485
+ },
486
+ {
487
+ "content": "EDR",
488
+ "lstrip": false,
489
+ "normalized": false,
490
+ "rstrip": false,
491
+ "single_word": false
492
+ },
493
+ {
494
+ "content": "EOF",
495
+ "lstrip": false,
496
+ "normalized": false,
497
+ "rstrip": false,
498
+ "single_word": false
499
+ },
500
+ {
501
+ "content": "EOTTI",
502
+ "lstrip": false,
503
+ "normalized": false,
504
+ "rstrip": false,
505
+ "single_word": false
506
+ },
507
+ {
508
+ "content": "EQoS",
509
+ "lstrip": false,
510
+ "normalized": false,
511
+ "rstrip": false,
512
+ "single_word": false
513
+ },
514
+ {
515
+ "content": "FCL",
516
+ "lstrip": false,
517
+ "normalized": false,
518
+ "rstrip": false,
519
+ "single_word": false
520
+ },
521
+ {
522
+ "content": "FHTI",
523
+ "lstrip": false,
524
+ "normalized": false,
525
+ "rstrip": false,
526
+ "single_word": false
527
+ },
528
+ {
529
+ "content": "FIPS",
530
+ "lstrip": false,
531
+ "normalized": false,
532
+ "rstrip": false,
533
+ "single_word": false
534
+ },
535
+ {
536
+ "content": "FMEA",
537
+ "lstrip": false,
538
+ "normalized": false,
539
+ "rstrip": false,
540
+ "single_word": false
541
+ },
542
+ {
543
+ "content": "FMON",
544
+ "lstrip": false,
545
+ "normalized": false,
546
+ "rstrip": false,
547
+ "single_word": false
548
+ },
549
+ {
550
+ "content": "FO",
551
+ "lstrip": false,
552
+ "normalized": false,
553
+ "rstrip": false,
554
+ "single_word": false
555
+ },
556
+ {
557
+ "content": "FP",
558
+ "lstrip": false,
559
+ "normalized": false,
560
+ "rstrip": false,
561
+ "single_word": false
562
+ },
563
+ {
564
+ "content": "FPS",
565
+ "lstrip": false,
566
+ "normalized": false,
567
+ "rstrip": false,
568
+ "single_word": false
569
+ },
570
+ {
571
+ "content": "FW",
572
+ "lstrip": false,
573
+ "normalized": false,
574
+ "rstrip": false,
575
+ "single_word": false
576
+ },
577
+ {
578
+ "content": "FuSa",
579
+ "lstrip": false,
580
+ "normalized": false,
581
+ "rstrip": false,
582
+ "single_word": false
583
+ },
584
+ {
585
+ "content": "GCM",
586
+ "lstrip": false,
587
+ "normalized": false,
588
+ "rstrip": false,
589
+ "single_word": false
590
+ },
591
+ {
592
+ "content": "GFD",
593
+ "lstrip": false,
594
+ "normalized": false,
595
+ "rstrip": false,
596
+ "single_word": false
597
+ },
598
+ {
599
+ "content": "GIC",
600
+ "lstrip": false,
601
+ "normalized": false,
602
+ "rstrip": false,
603
+ "single_word": false
604
+ },
605
+ {
606
+ "content": "GMAC",
607
+ "lstrip": false,
608
+ "normalized": false,
609
+ "rstrip": false,
610
+ "single_word": false
611
+ },
612
+ {
613
+ "content": "GMSL",
614
+ "lstrip": false,
615
+ "normalized": false,
616
+ "rstrip": false,
617
+ "single_word": false
618
+ },
619
+ {
620
+ "content": "GOP",
621
+ "lstrip": false,
622
+ "normalized": false,
623
+ "rstrip": false,
624
+ "single_word": false
625
+ },
626
+ {
627
+ "content": "GP",
628
+ "lstrip": false,
629
+ "normalized": false,
630
+ "rstrip": false,
631
+ "single_word": false
632
+ },
633
+ {
634
+ "content": "GPCDMA",
635
+ "lstrip": false,
636
+ "normalized": false,
637
+ "rstrip": false,
638
+ "single_word": false
639
+ },
640
+ {
641
+ "content": "GPU",
642
+ "lstrip": false,
643
+ "normalized": false,
644
+ "rstrip": false,
645
+ "single_word": false
646
+ },
647
+ {
648
+ "content": "GR",
649
+ "lstrip": false,
650
+ "normalized": false,
651
+ "rstrip": false,
652
+ "single_word": false
653
+ },
654
+ {
655
+ "content": "Gpps",
656
+ "lstrip": false,
657
+ "normalized": false,
658
+ "rstrip": false,
659
+ "single_word": false
660
+ },
661
+ {
662
+ "content": "HBR",
663
+ "lstrip": false,
664
+ "normalized": false,
665
+ "rstrip": false,
666
+ "single_word": false
667
+ },
668
+ {
669
+ "content": "HBR2",
670
+ "lstrip": false,
671
+ "normalized": false,
672
+ "rstrip": false,
673
+ "single_word": false
674
+ },
675
+ {
676
+ "content": "HBR3",
677
+ "lstrip": false,
678
+ "normalized": false,
679
+ "rstrip": false,
680
+ "single_word": false
681
+ },
682
+ {
683
+ "content": "HDS",
684
+ "lstrip": false,
685
+ "normalized": false,
686
+ "rstrip": false,
687
+ "single_word": false
688
+ },
689
+ {
690
+ "content": "HIS",
691
+ "lstrip": false,
692
+ "normalized": false,
693
+ "rstrip": false,
694
+ "single_word": false
695
+ },
696
+ {
697
+ "content": "HMAC",
698
+ "lstrip": false,
699
+ "normalized": false,
700
+ "rstrip": false,
701
+ "single_word": false
702
+ },
703
+ {
704
+ "content": "HPSE",
705
+ "lstrip": false,
706
+ "normalized": false,
707
+ "rstrip": false,
708
+ "single_word": false
709
+ },
710
+ {
711
+ "content": "HSI",
712
+ "lstrip": false,
713
+ "normalized": false,
714
+ "rstrip": false,
715
+ "single_word": false
716
+ },
717
+ {
718
+ "content": "HSM",
719
+ "lstrip": false,
720
+ "normalized": false,
721
+ "rstrip": false,
722
+ "single_word": false
723
+ },
724
+ {
725
+ "content": "HSP",
726
+ "lstrip": false,
727
+ "normalized": false,
728
+ "rstrip": false,
729
+ "single_word": false
730
+ },
731
+ {
732
+ "content": "HW",
733
+ "lstrip": false,
734
+ "normalized": false,
735
+ "rstrip": false,
736
+ "single_word": false
737
+ },
738
+ {
739
+ "content": "IAS",
740
+ "lstrip": false,
741
+ "normalized": false,
742
+ "rstrip": false,
743
+ "single_word": false
744
+ },
745
+ {
746
+ "content": "IC",
747
+ "lstrip": false,
748
+ "normalized": false,
749
+ "rstrip": false,
750
+ "single_word": false
751
+ },
752
+ {
753
+ "content": "ICD",
754
+ "lstrip": false,
755
+ "normalized": false,
756
+ "rstrip": false,
757
+ "single_word": false
758
+ },
759
+ {
760
+ "content": "IDR",
761
+ "lstrip": false,
762
+ "normalized": false,
763
+ "rstrip": false,
764
+ "single_word": false
765
+ },
766
+ {
767
+ "content": "IDT",
768
+ "lstrip": false,
769
+ "normalized": false,
770
+ "rstrip": false,
771
+ "single_word": false
772
+ },
773
+ {
774
+ "content": "IEP",
775
+ "lstrip": false,
776
+ "normalized": false,
777
+ "rstrip": false,
778
+ "single_word": false
779
+ },
780
+ {
781
+ "content": "IEU",
782
+ "lstrip": false,
783
+ "normalized": false,
784
+ "rstrip": false,
785
+ "single_word": false
786
+ },
787
+ {
788
+ "content": "IFU",
789
+ "lstrip": false,
790
+ "normalized": false,
791
+ "rstrip": false,
792
+ "single_word": false
793
+ },
794
+ {
795
+ "content": "IID",
796
+ "lstrip": false,
797
+ "normalized": false,
798
+ "rstrip": false,
799
+ "single_word": false
800
+ },
801
+ {
802
+ "content": "ILD",
803
+ "lstrip": false,
804
+ "normalized": false,
805
+ "rstrip": false,
806
+ "single_word": false
807
+ },
808
+ {
809
+ "content": "IMEM",
810
+ "lstrip": false,
811
+ "normalized": false,
812
+ "rstrip": false,
813
+ "single_word": false
814
+ },
815
+ {
816
+ "content": "IOC",
817
+ "lstrip": false,
818
+ "normalized": false,
819
+ "rstrip": false,
820
+ "single_word": false
821
+ },
822
+ {
823
+ "content": "IOFA",
824
+ "lstrip": false,
825
+ "normalized": false,
826
+ "rstrip": false,
827
+ "single_word": false
828
+ },
829
+ {
830
+ "content": "IOMMU",
831
+ "lstrip": false,
832
+ "normalized": false,
833
+ "rstrip": false,
834
+ "single_word": false
835
+ },
836
+ {
837
+ "content": "IPC",
838
+ "lstrip": false,
839
+ "normalized": false,
840
+ "rstrip": false,
841
+ "single_word": false
842
+ },
843
+ {
844
+ "content": "IPI",
845
+ "lstrip": false,
846
+ "normalized": false,
847
+ "rstrip": false,
848
+ "single_word": false
849
+ },
850
+ {
851
+ "content": "IRF",
852
+ "lstrip": false,
853
+ "normalized": false,
854
+ "rstrip": false,
855
+ "single_word": false
856
+ },
857
+ {
858
+ "content": "IST",
859
+ "lstrip": false,
860
+ "normalized": false,
861
+ "rstrip": false,
862
+ "single_word": false
863
+ },
864
+ {
865
+ "content": "IV",
866
+ "lstrip": false,
867
+ "normalized": false,
868
+ "rstrip": false,
869
+ "single_word": false
870
+ },
871
+ {
872
+ "content": "IoT",
873
+ "lstrip": false,
874
+ "normalized": false,
875
+ "rstrip": false,
876
+ "single_word": false
877
+ },
878
+ {
879
+ "content": "JSR",
880
+ "lstrip": false,
881
+ "normalized": false,
882
+ "rstrip": false,
883
+ "single_word": false
884
+ },
885
+ {
886
+ "content": "KAT",
887
+ "lstrip": false,
888
+ "normalized": false,
889
+ "rstrip": false,
890
+ "single_word": false
891
+ },
892
+ {
893
+ "content": "KCV",
894
+ "lstrip": false,
895
+ "normalized": false,
896
+ "rstrip": false,
897
+ "single_word": false
898
+ },
899
+ {
900
+ "content": "KDF",
901
+ "lstrip": false,
902
+ "normalized": false,
903
+ "rstrip": false,
904
+ "single_word": false
905
+ },
906
+ {
907
+ "content": "KPI",
908
+ "lstrip": false,
909
+ "normalized": false,
910
+ "rstrip": false,
911
+ "single_word": false
912
+ },
913
+ {
914
+ "content": "L1PT",
915
+ "lstrip": false,
916
+ "normalized": false,
917
+ "rstrip": false,
918
+ "single_word": false
919
+ },
920
+ {
921
+ "content": "L2C",
922
+ "lstrip": false,
923
+ "normalized": false,
924
+ "rstrip": false,
925
+ "single_word": false
926
+ },
927
+ {
928
+ "content": "L2mDIR",
929
+ "lstrip": false,
930
+ "normalized": false,
931
+ "rstrip": false,
932
+ "single_word": false
933
+ },
934
+ {
935
+ "content": "L2vDIR",
936
+ "lstrip": false,
937
+ "normalized": false,
938
+ "rstrip": false,
939
+ "single_word": false
940
+ },
941
+ {
942
+ "content": "LAB",
943
+ "lstrip": false,
944
+ "normalized": false,
945
+ "rstrip": false,
946
+ "single_word": false
947
+ },
948
+ {
949
+ "content": "LBIST",
950
+ "lstrip": false,
951
+ "normalized": false,
952
+ "rstrip": false,
953
+ "single_word": false
954
+ },
955
+ {
956
+ "content": "LDC",
957
+ "lstrip": false,
958
+ "normalized": false,
959
+ "rstrip": false,
960
+ "single_word": false
961
+ },
962
+ {
963
+ "content": "LFT",
964
+ "lstrip": false,
965
+ "normalized": false,
966
+ "rstrip": false,
967
+ "single_word": false
968
+ },
969
+ {
970
+ "content": "LIC",
971
+ "lstrip": false,
972
+ "normalized": false,
973
+ "rstrip": false,
974
+ "single_word": false
975
+ },
976
+ {
977
+ "content": "LIP",
978
+ "lstrip": false,
979
+ "normalized": false,
980
+ "rstrip": false,
981
+ "single_word": false
982
+ },
983
+ {
984
+ "content": "LSB",
985
+ "lstrip": false,
986
+ "normalized": false,
987
+ "rstrip": false,
988
+ "single_word": false
989
+ },
990
+ {
991
+ "content": "MAC",
992
+ "lstrip": false,
993
+ "normalized": false,
994
+ "rstrip": false,
995
+ "single_word": false
996
+ },
997
+ {
998
+ "content": "MAQ",
999
+ "lstrip": false,
1000
+ "normalized": false,
1001
+ "rstrip": false,
1002
+ "single_word": false
1003
+ },
1004
+ {
1005
+ "content": "MB",
1006
+ "lstrip": false,
1007
+ "normalized": false,
1008
+ "rstrip": false,
1009
+ "single_word": false
1010
+ },
1011
+ {
1012
+ "content": "MBIST",
1013
+ "lstrip": false,
1014
+ "normalized": false,
1015
+ "rstrip": false,
1016
+ "single_word": false
1017
+ },
1018
+ {
1019
+ "content": "MCAL",
1020
+ "lstrip": false,
1021
+ "normalized": false,
1022
+ "rstrip": false,
1023
+ "single_word": false
1024
+ },
1025
+ {
1026
+ "content": "MCE",
1027
+ "lstrip": false,
1028
+ "normalized": false,
1029
+ "rstrip": false,
1030
+ "single_word": false
1031
+ },
1032
+ {
1033
+ "content": "MCU",
1034
+ "lstrip": false,
1035
+ "normalized": false,
1036
+ "rstrip": false,
1037
+ "single_word": false
1038
+ },
1039
+ {
1040
+ "content": "MSB",
1041
+ "lstrip": false,
1042
+ "normalized": false,
1043
+ "rstrip": false,
1044
+ "single_word": false
1045
+ },
1046
+ {
1047
+ "content": "MSS",
1048
+ "lstrip": false,
1049
+ "normalized": false,
1050
+ "rstrip": false,
1051
+ "single_word": false
1052
+ },
1053
+ {
1054
+ "content": "MST",
1055
+ "lstrip": false,
1056
+ "normalized": false,
1057
+ "rstrip": false,
1058
+ "single_word": false
1059
+ },
1060
+ {
1061
+ "content": "MTS",
1062
+ "lstrip": false,
1063
+ "normalized": false,
1064
+ "rstrip": false,
1065
+ "single_word": false
1066
+ },
1067
+ {
1068
+ "content": "MiTM",
1069
+ "lstrip": false,
1070
+ "normalized": false,
1071
+ "rstrip": false,
1072
+ "single_word": false
1073
+ },
1074
+ {
1075
+ "content": "NIP",
1076
+ "lstrip": false,
1077
+ "normalized": false,
1078
+ "rstrip": false,
1079
+ "single_word": false
1080
+ },
1081
+ {
1082
+ "content": "NIST",
1083
+ "lstrip": false,
1084
+ "normalized": false,
1085
+ "rstrip": false,
1086
+ "single_word": false
1087
+ },
1088
+ {
1089
+ "content": "NITO",
1090
+ "lstrip": false,
1091
+ "normalized": false,
1092
+ "rstrip": false,
1093
+ "single_word": false
1094
+ },
1095
+ {
1096
+ "content": "NOC",
1097
+ "lstrip": false,
1098
+ "normalized": false,
1099
+ "rstrip": false,
1100
+ "single_word": false
1101
+ },
1102
+ {
1103
+ "content": "NOOP",
1104
+ "lstrip": false,
1105
+ "normalized": false,
1106
+ "rstrip": false,
1107
+ "single_word": false
1108
+ },
1109
+ {
1110
+ "content": "NT",
1111
+ "lstrip": false,
1112
+ "normalized": false,
1113
+ "rstrip": false,
1114
+ "single_word": false
1115
+ },
1116
+ {
1117
+ "content": "NVDEC",
1118
+ "lstrip": false,
1119
+ "normalized": false,
1120
+ "rstrip": false,
1121
+ "single_word": false
1122
+ },
1123
+ {
1124
+ "content": "NVENC",
1125
+ "lstrip": false,
1126
+ "normalized": false,
1127
+ "rstrip": false,
1128
+ "single_word": false
1129
+ },
1130
+ {
1131
+ "content": "NVJPG",
1132
+ "lstrip": false,
1133
+ "normalized": false,
1134
+ "rstrip": false,
1135
+ "single_word": false
1136
+ },
1137
+ {
1138
+ "content": "NVM",
1139
+ "lstrip": false,
1140
+ "normalized": false,
1141
+ "rstrip": false,
1142
+ "single_word": false
1143
+ },
1144
+ {
1145
+ "content": "NVVSE",
1146
+ "lstrip": false,
1147
+ "normalized": false,
1148
+ "rstrip": false,
1149
+ "single_word": false
1150
+ },
1151
+ {
1152
+ "content": "OEM",
1153
+ "lstrip": false,
1154
+ "normalized": false,
1155
+ "rstrip": false,
1156
+ "single_word": false
1157
+ },
1158
+ {
1159
+ "content": "OFA",
1160
+ "lstrip": false,
1161
+ "normalized": false,
1162
+ "rstrip": false,
1163
+ "single_word": false
1164
+ },
1165
+ {
1166
+ "content": "OS",
1167
+ "lstrip": false,
1168
+ "normalized": false,
1169
+ "rstrip": false,
1170
+ "single_word": false
1171
+ },
1172
+ {
1173
+ "content": "OSP",
1174
+ "lstrip": false,
1175
+ "normalized": false,
1176
+ "rstrip": false,
1177
+ "single_word": false
1178
+ },
1179
+ {
1180
+ "content": "OTP",
1181
+ "lstrip": false,
1182
+ "normalized": false,
1183
+ "rstrip": false,
1184
+ "single_word": false
1185
+ },
1186
+ {
1187
+ "content": "PB",
1188
+ "lstrip": false,
1189
+ "normalized": false,
1190
+ "rstrip": false,
1191
+ "single_word": false
1192
+ },
1193
+ {
1194
+ "content": "PCIE",
1195
+ "lstrip": false,
1196
+ "normalized": false,
1197
+ "rstrip": false,
1198
+ "single_word": false
1199
+ },
1200
+ {
1201
+ "content": "PCPU",
1202
+ "lstrip": false,
1203
+ "normalized": false,
1204
+ "rstrip": false,
1205
+ "single_word": false
1206
+ },
1207
+ {
1208
+ "content": "PCR",
1209
+ "lstrip": false,
1210
+ "normalized": false,
1211
+ "rstrip": false,
1212
+ "single_word": false
1213
+ },
1214
+ {
1215
+ "content": "PCT",
1216
+ "lstrip": false,
1217
+ "normalized": false,
1218
+ "rstrip": false,
1219
+ "single_word": false
1220
+ },
1221
+ {
1222
+ "content": "PDK",
1223
+ "lstrip": false,
1224
+ "normalized": false,
1225
+ "rstrip": false,
1226
+ "single_word": false
1227
+ },
1228
+ {
1229
+ "content": "PII",
1230
+ "lstrip": false,
1231
+ "normalized": false,
1232
+ "rstrip": false,
1233
+ "single_word": false
1234
+ },
1235
+ {
1236
+ "content": "PIP",
1237
+ "lstrip": false,
1238
+ "normalized": false,
1239
+ "rstrip": false,
1240
+ "single_word": false
1241
+ },
1242
+ {
1243
+ "content": "PKC",
1244
+ "lstrip": false,
1245
+ "normalized": false,
1246
+ "rstrip": false,
1247
+ "single_word": false
1248
+ },
1249
+ {
1250
+ "content": "PKCS",
1251
+ "lstrip": false,
1252
+ "normalized": false,
1253
+ "rstrip": false,
1254
+ "single_word": false
1255
+ },
1256
+ {
1257
+ "content": "PKI",
1258
+ "lstrip": false,
1259
+ "normalized": false,
1260
+ "rstrip": false,
1261
+ "single_word": false
1262
+ },
1263
+ {
1264
+ "content": "PL",
1265
+ "lstrip": false,
1266
+ "normalized": false,
1267
+ "rstrip": false,
1268
+ "single_word": false
1269
+ },
1270
+ {
1271
+ "content": "PLA",
1272
+ "lstrip": false,
1273
+ "normalized": false,
1274
+ "rstrip": false,
1275
+ "single_word": false
1276
+ },
1277
+ {
1278
+ "content": "POR",
1279
+ "lstrip": false,
1280
+ "normalized": false,
1281
+ "rstrip": false,
1282
+ "single_word": false
1283
+ },
1284
+ {
1285
+ "content": "PPC",
1286
+ "lstrip": false,
1287
+ "normalized": false,
1288
+ "rstrip": false,
1289
+ "single_word": false
1290
+ },
1291
+ {
1292
+ "content": "PSC",
1293
+ "lstrip": false,
1294
+ "normalized": false,
1295
+ "rstrip": false,
1296
+ "single_word": false
1297
+ },
1298
+ {
1299
+ "content": "PTXT",
1300
+ "lstrip": false,
1301
+ "normalized": false,
1302
+ "rstrip": false,
1303
+ "single_word": false
1304
+ },
1305
+ {
1306
+ "content": "PVA",
1307
+ "lstrip": false,
1308
+ "normalized": false,
1309
+ "rstrip": false,
1310
+ "single_word": false
1311
+ },
1312
+ {
1313
+ "content": "QNX",
1314
+ "lstrip": false,
1315
+ "normalized": false,
1316
+ "rstrip": false,
1317
+ "single_word": false
1318
+ },
1319
+ {
1320
+ "content": "QOS",
1321
+ "lstrip": false,
1322
+ "normalized": false,
1323
+ "rstrip": false,
1324
+ "single_word": false
1325
+ },
1326
+ {
1327
+ "content": "QSPI",
1328
+ "lstrip": false,
1329
+ "normalized": false,
1330
+ "rstrip": false,
1331
+ "single_word": false
1332
+ },
1333
+ {
1334
+ "content": "RBG",
1335
+ "lstrip": false,
1336
+ "normalized": false,
1337
+ "rstrip": false,
1338
+ "single_word": false
1339
+ },
1340
+ {
1341
+ "content": "RBR",
1342
+ "lstrip": false,
1343
+ "normalized": false,
1344
+ "rstrip": false,
1345
+ "single_word": false
1346
+ },
1347
+ {
1348
+ "content": "RC",
1349
+ "lstrip": false,
1350
+ "normalized": false,
1351
+ "rstrip": false,
1352
+ "single_word": false
1353
+ },
1354
+ {
1355
+ "content": "RDEV",
1356
+ "lstrip": false,
1357
+ "normalized": false,
1358
+ "rstrip": false,
1359
+ "single_word": false
1360
+ },
1361
+ {
1362
+ "content": "REE",
1363
+ "lstrip": false,
1364
+ "normalized": false,
1365
+ "rstrip": false,
1366
+ "single_word": false
1367
+ },
1368
+ {
1369
+ "content": "RMA",
1370
+ "lstrip": false,
1371
+ "normalized": false,
1372
+ "rstrip": false,
1373
+ "single_word": false
1374
+ },
1375
+ {
1376
+ "content": "RMW",
1377
+ "lstrip": false,
1378
+ "normalized": false,
1379
+ "rstrip": false,
1380
+ "single_word": false
1381
+ },
1382
+ {
1383
+ "content": "RSA",
1384
+ "lstrip": false,
1385
+ "normalized": false,
1386
+ "rstrip": false,
1387
+ "single_word": false
1388
+ },
1389
+ {
1390
+ "content": "RSB",
1391
+ "lstrip": false,
1392
+ "normalized": false,
1393
+ "rstrip": false,
1394
+ "single_word": false
1395
+ },
1396
+ {
1397
+ "content": "RTS",
1398
+ "lstrip": false,
1399
+ "normalized": false,
1400
+ "rstrip": false,
1401
+ "single_word": false
1402
+ },
1403
+ {
1404
+ "content": "RoT",
1405
+ "lstrip": false,
1406
+ "normalized": false,
1407
+ "rstrip": false,
1408
+ "single_word": false
1409
+ },
1410
+ {
1411
+ "content": "SAE",
1412
+ "lstrip": false,
1413
+ "normalized": false,
1414
+ "rstrip": false,
1415
+ "single_word": false
1416
+ },
1417
+ {
1418
+ "content": "SBK",
1419
+ "lstrip": false,
1420
+ "normalized": false,
1421
+ "rstrip": false,
1422
+ "single_word": false
1423
+ },
1424
+ {
1425
+ "content": "SCH",
1426
+ "lstrip": false,
1427
+ "normalized": false,
1428
+ "rstrip": false,
1429
+ "single_word": false
1430
+ },
1431
+ {
1432
+ "content": "SDK",
1433
+ "lstrip": false,
1434
+ "normalized": false,
1435
+ "rstrip": false,
1436
+ "single_word": false
1437
+ },
1438
+ {
1439
+ "content": "SE",
1440
+ "lstrip": false,
1441
+ "normalized": false,
1442
+ "rstrip": false,
1443
+ "single_word": false
1444
+ },
1445
+ {
1446
+ "content": "SEL0",
1447
+ "lstrip": false,
1448
+ "normalized": false,
1449
+ "rstrip": false,
1450
+ "single_word": false
1451
+ },
1452
+ {
1453
+ "content": "SEL1",
1454
+ "lstrip": false,
1455
+ "normalized": false,
1456
+ "rstrip": false,
1457
+ "single_word": false
1458
+ },
1459
+ {
1460
+ "content": "SEooC",
1461
+ "lstrip": false,
1462
+ "normalized": false,
1463
+ "rstrip": false,
1464
+ "single_word": false
1465
+ },
1466
+ {
1467
+ "content": "SGM",
1468
+ "lstrip": false,
1469
+ "normalized": false,
1470
+ "rstrip": false,
1471
+ "single_word": false
1472
+ },
1473
+ {
1474
+ "content": "SHA",
1475
+ "lstrip": false,
1476
+ "normalized": false,
1477
+ "rstrip": false,
1478
+ "single_word": false
1479
+ },
1480
+ {
1481
+ "content": "SHA256",
1482
+ "lstrip": false,
1483
+ "normalized": false,
1484
+ "rstrip": false,
1485
+ "single_word": false
1486
+ },
1487
+ {
1488
+ "content": "SHA512",
1489
+ "lstrip": false,
1490
+ "normalized": false,
1491
+ "rstrip": false,
1492
+ "single_word": false
1493
+ },
1494
+ {
1495
+ "content": "SHE",
1496
+ "lstrip": false,
1497
+ "normalized": false,
1498
+ "rstrip": false,
1499
+ "single_word": false
1500
+ },
1501
+ {
1502
+ "content": "SKU",
1503
+ "lstrip": false,
1504
+ "normalized": false,
1505
+ "rstrip": false,
1506
+ "single_word": false
1507
+ },
1508
+ {
1509
+ "content": "SNOC",
1510
+ "lstrip": false,
1511
+ "normalized": false,
1512
+ "rstrip": false,
1513
+ "single_word": false
1514
+ },
1515
+ {
1516
+ "content": "SO",
1517
+ "lstrip": false,
1518
+ "normalized": false,
1519
+ "rstrip": false,
1520
+ "single_word": false
1521
+ },
1522
+ {
1523
+ "content": "SPA",
1524
+ "lstrip": false,
1525
+ "normalized": false,
1526
+ "rstrip": false,
1527
+ "single_word": false
1528
+ },
1529
+ {
1530
+ "content": "SQ",
1531
+ "lstrip": false,
1532
+ "normalized": false,
1533
+ "rstrip": false,
1534
+ "single_word": false
1535
+ },
1536
+ {
1537
+ "content": "SSR",
1538
+ "lstrip": false,
1539
+ "normalized": false,
1540
+ "rstrip": false,
1541
+ "single_word": false
1542
+ },
1543
+ {
1544
+ "content": "SST",
1545
+ "lstrip": false,
1546
+ "normalized": false,
1547
+ "rstrip": false,
1548
+ "single_word": false
1549
+ },
1550
+ {
1551
+ "content": "SW",
1552
+ "lstrip": false,
1553
+ "normalized": false,
1554
+ "rstrip": false,
1555
+ "single_word": false
1556
+ },
1557
+ {
1558
+ "content": "SWAT",
1559
+ "lstrip": false,
1560
+ "normalized": false,
1561
+ "rstrip": false,
1562
+ "single_word": false
1563
+ },
1564
+ {
1565
+ "content": "SoC",
1566
+ "lstrip": false,
1567
+ "normalized": false,
1568
+ "rstrip": false,
1569
+ "single_word": false
1570
+ },
1571
+ {
1572
+ "content": "TA",
1573
+ "lstrip": false,
1574
+ "normalized": false,
1575
+ "rstrip": false,
1576
+ "single_word": false
1577
+ },
1578
+ {
1579
+ "content": "TCF",
1580
+ "lstrip": false,
1581
+ "normalized": false,
1582
+ "rstrip": false,
1583
+ "single_word": false
1584
+ },
1585
+ {
1586
+ "content": "TEE",
1587
+ "lstrip": false,
1588
+ "normalized": false,
1589
+ "rstrip": false,
1590
+ "single_word": false
1591
+ },
1592
+ {
1593
+ "content": "THI",
1594
+ "lstrip": false,
1595
+ "normalized": false,
1596
+ "rstrip": false,
1597
+ "single_word": false
1598
+ },
1599
+ {
1600
+ "content": "TNR",
1601
+ "lstrip": false,
1602
+ "normalized": false,
1603
+ "rstrip": false,
1604
+ "single_word": false
1605
+ },
1606
+ {
1607
+ "content": "TOS",
1608
+ "lstrip": false,
1609
+ "normalized": false,
1610
+ "rstrip": false,
1611
+ "single_word": false
1612
+ },
1613
+ {
1614
+ "content": "TRC",
1615
+ "lstrip": false,
1616
+ "normalized": false,
1617
+ "rstrip": false,
1618
+ "single_word": false
1619
+ },
1620
+ {
1621
+ "content": "TRL",
1622
+ "lstrip": false,
1623
+ "normalized": false,
1624
+ "rstrip": false,
1625
+ "single_word": false
1626
+ },
1627
+ {
1628
+ "content": "TSEC",
1629
+ "lstrip": false,
1630
+ "normalized": false,
1631
+ "rstrip": false,
1632
+ "single_word": false
1633
+ },
1634
+ {
1635
+ "content": "TZ",
1636
+ "lstrip": false,
1637
+ "normalized": false,
1638
+ "rstrip": false,
1639
+ "single_word": false
1640
+ },
1641
+ {
1642
+ "content": "UFS",
1643
+ "lstrip": false,
1644
+ "normalized": false,
1645
+ "rstrip": false,
1646
+ "single_word": false
1647
+ },
1648
+ {
1649
+ "content": "VBR",
1650
+ "lstrip": false,
1651
+ "normalized": false,
1652
+ "rstrip": false,
1653
+ "single_word": false
1654
+ },
1655
+ {
1656
+ "content": "VCPU",
1657
+ "lstrip": false,
1658
+ "normalized": false,
1659
+ "rstrip": false,
1660
+ "single_word": false
1661
+ },
1662
+ {
1663
+ "content": "VI",
1664
+ "lstrip": false,
1665
+ "normalized": false,
1666
+ "rstrip": false,
1667
+ "single_word": false
1668
+ },
1669
+ {
1670
+ "content": "VIC",
1671
+ "lstrip": false,
1672
+ "normalized": false,
1673
+ "rstrip": false,
1674
+ "single_word": false
1675
+ },
1676
+ {
1677
+ "content": "VMEM",
1678
+ "lstrip": false,
1679
+ "normalized": false,
1680
+ "rstrip": false,
1681
+ "single_word": false
1682
+ },
1683
+ {
1684
+ "content": "VMID",
1685
+ "lstrip": false,
1686
+ "normalized": false,
1687
+ "rstrip": false,
1688
+ "single_word": false
1689
+ },
1690
+ {
1691
+ "content": "VPU",
1692
+ "lstrip": false,
1693
+ "normalized": false,
1694
+ "rstrip": false,
1695
+ "single_word": false
1696
+ },
1697
+ {
1698
+ "content": "VRC",
1699
+ "lstrip": false,
1700
+ "normalized": false,
1701
+ "rstrip": false,
1702
+ "single_word": false
1703
+ },
1704
+ {
1705
+ "content": "VUI",
1706
+ "lstrip": false,
1707
+ "normalized": false,
1708
+ "rstrip": false,
1709
+ "single_word": false
1710
+ },
1711
+ {
1712
+ "content": "WARB",
1713
+ "lstrip": false,
1714
+ "normalized": false,
1715
+ "rstrip": false,
1716
+ "single_word": false
1717
+ },
1718
+ {
1719
+ "content": "XIP",
1720
+ "lstrip": false,
1721
+ "normalized": false,
1722
+ "rstrip": false,
1723
+ "single_word": false
1724
+ },
1725
+ {
1726
+ "content": "bpp",
1727
+ "lstrip": false,
1728
+ "normalized": false,
1729
+ "rstrip": false,
1730
+ "single_word": false
1731
+ },
1732
+ {
1733
+ "content": "eMMC",
1734
+ "lstrip": false,
1735
+ "normalized": false,
1736
+ "rstrip": false,
1737
+ "single_word": false
1738
+ },
1739
+ {
1740
+ "content": "hfPLA",
1741
+ "lstrip": false,
1742
+ "normalized": false,
1743
+ "rstrip": false,
1744
+ "single_word": false
1745
+ },
1746
+ {
1747
+ "content": "iGPU",
1748
+ "lstrip": false,
1749
+ "normalized": false,
1750
+ "rstrip": false,
1751
+ "single_word": false
1752
+ },
1753
+ {
1754
+ "content": "ipc",
1755
+ "lstrip": false,
1756
+ "normalized": false,
1757
+ "rstrip": false,
1758
+ "single_word": false
1759
+ },
1760
+ {
1761
+ "content": "ipc_fg",
1762
+ "lstrip": false,
1763
+ "normalized": false,
1764
+ "rstrip": false,
1765
+ "single_word": false
1766
+ },
1767
+ {
1768
+ "content": "ipc_t",
1769
+ "lstrip": false,
1770
+ "normalized": false,
1771
+ "rstrip": false,
1772
+ "single_word": false
1773
+ },
1774
+ {
1775
+ "content": "sbPLA",
1776
+ "lstrip": false,
1777
+ "normalized": false,
1778
+ "rstrip": false,
1779
+ "single_word": false
1780
+ },
1781
+ {
1782
+ "content": "xBTV",
1783
+ "lstrip": false,
1784
+ "normalized": false,
1785
+ "rstrip": false,
1786
+ "single_word": false
1787
+ },
1788
+ {
1789
+ "content": "xps",
1790
+ "lstrip": false,
1791
+ "normalized": false,
1792
+ "rstrip": false,
1793
+ "single_word": false
1794
+ }
1795
+ ],
1796
+ "bos_token": {
1797
+ "content": "<|startoftext|>",
1798
+ "lstrip": false,
1799
+ "normalized": false,
1800
+ "rstrip": false,
1801
+ "single_word": false
1802
+ },
1803
+ "eos_token": {
1804
+ "content": "<|return|>",
1805
+ "lstrip": false,
1806
+ "normalized": false,
1807
+ "rstrip": false,
1808
+ "single_word": false
1809
+ },
1810
+ "pad_token": {
1811
+ "content": "<|endoftext|>",
1812
+ "lstrip": false,
1813
+ "normalized": false,
1814
+ "rstrip": false,
1815
+ "single_word": false
1816
+ }
1817
+ }
checkpoint-1642/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ec3af79eb37b392bb5382bfe3f4eeab633498c220a804f4fd5d7d102a000f1a
3
+ size 27914312
checkpoint-1642/tokenizer_config.json ADDED
@@ -0,0 +1,2489 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "1529": {
4
+ "content": "SE",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "2022": {
12
+ "content": "IC",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2416": {
20
+ "content": "AD",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3360": {
28
+ "content": "OS",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "4478": {
36
+ "content": "IV",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "5173": {
44
+ "content": "PL",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "6258": {
52
+ "content": "IST",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "6781": {
60
+ "content": "CA",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "7726": {
68
+ "content": "FO",
69
+ "lstrip": false,
70
+ "normalized": false,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": true
74
+ },
75
+ "9375": {
76
+ "content": "REE",
77
+ "lstrip": false,
78
+ "normalized": false,
79
+ "rstrip": false,
80
+ "single_word": false,
81
+ "special": true
82
+ },
83
+ "9760": {
84
+ "content": "EC",
85
+ "lstrip": false,
86
+ "normalized": false,
87
+ "rstrip": false,
88
+ "single_word": false,
89
+ "special": true
90
+ },
91
+ "10227": {
92
+ "content": "TA",
93
+ "lstrip": false,
94
+ "normalized": false,
95
+ "rstrip": false,
96
+ "single_word": false,
97
+ "special": true
98
+ },
99
+ "11720": {
100
+ "content": "LIC",
101
+ "lstrip": false,
102
+ "normalized": false,
103
+ "rstrip": false,
104
+ "single_word": false,
105
+ "special": true
106
+ },
107
+ "12235": {
108
+ "content": "NT",
109
+ "lstrip": false,
110
+ "normalized": false,
111
+ "rstrip": false,
112
+ "single_word": false,
113
+ "special": true
114
+ },
115
+ "12515": {
116
+ "content": "RC",
117
+ "lstrip": false,
118
+ "normalized": false,
119
+ "rstrip": false,
120
+ "single_word": false,
121
+ "special": true
122
+ },
123
+ "13874": {
124
+ "content": "MB",
125
+ "lstrip": false,
126
+ "normalized": false,
127
+ "rstrip": false,
128
+ "single_word": false,
129
+ "special": true
130
+ },
131
+ "13905": {
132
+ "content": "GR",
133
+ "lstrip": false,
134
+ "normalized": false,
135
+ "rstrip": false,
136
+ "single_word": false,
137
+ "special": true
138
+ },
139
+ "15409": {
140
+ "content": "DU",
141
+ "lstrip": false,
142
+ "normalized": false,
143
+ "rstrip": false,
144
+ "single_word": false,
145
+ "special": true
146
+ },
147
+ "17183": {
148
+ "content": "DT",
149
+ "lstrip": false,
150
+ "normalized": false,
151
+ "rstrip": false,
152
+ "single_word": false,
153
+ "special": true
154
+ },
155
+ "19862": {
156
+ "content": "SO",
157
+ "lstrip": false,
158
+ "normalized": false,
159
+ "rstrip": false,
160
+ "single_word": false,
161
+ "special": true
162
+ },
163
+ "20174": {
164
+ "content": "FP",
165
+ "lstrip": false,
166
+ "normalized": false,
167
+ "rstrip": false,
168
+ "single_word": false,
169
+ "special": true
170
+ },
171
+ "22723": {
172
+ "content": "VI",
173
+ "lstrip": false,
174
+ "normalized": false,
175
+ "rstrip": false,
176
+ "single_word": false,
177
+ "special": true
178
+ },
179
+ "27968": {
180
+ "content": "SW",
181
+ "lstrip": false,
182
+ "normalized": false,
183
+ "rstrip": false,
184
+ "single_word": false,
185
+ "special": true
186
+ },
187
+ "29829": {
188
+ "content": "CV",
189
+ "lstrip": false,
190
+ "normalized": false,
191
+ "rstrip": false,
192
+ "single_word": false,
193
+ "special": true
194
+ },
195
+ "29864": {
196
+ "content": "GP",
197
+ "lstrip": false,
198
+ "normalized": false,
199
+ "rstrip": false,
200
+ "single_word": false,
201
+ "special": true
202
+ },
203
+ "34134": {
204
+ "content": "ILD",
205
+ "lstrip": false,
206
+ "normalized": false,
207
+ "rstrip": false,
208
+ "single_word": false,
209
+ "special": true
210
+ },
211
+ "34435": {
212
+ "content": "FW",
213
+ "lstrip": false,
214
+ "normalized": false,
215
+ "rstrip": false,
216
+ "single_word": false,
217
+ "special": true
218
+ },
219
+ "39749": {
220
+ "content": "TRL",
221
+ "lstrip": false,
222
+ "normalized": false,
223
+ "rstrip": false,
224
+ "single_word": false,
225
+ "special": true
226
+ },
227
+ "43230": {
228
+ "content": "LAB",
229
+ "lstrip": false,
230
+ "normalized": false,
231
+ "rstrip": false,
232
+ "single_word": false,
233
+ "special": true
234
+ },
235
+ "46966": {
236
+ "content": "SDK",
237
+ "lstrip": false,
238
+ "normalized": false,
239
+ "rstrip": false,
240
+ "single_word": false,
241
+ "special": true
242
+ },
243
+ "47787": {
244
+ "content": "CPU",
245
+ "lstrip": false,
246
+ "normalized": false,
247
+ "rstrip": false,
248
+ "single_word": false,
249
+ "special": true
250
+ },
251
+ "47994": {
252
+ "content": "MAC",
253
+ "lstrip": false,
254
+ "normalized": false,
255
+ "rstrip": false,
256
+ "single_word": false,
257
+ "special": true
258
+ },
259
+ "50719": {
260
+ "content": "IAS",
261
+ "lstrip": false,
262
+ "normalized": false,
263
+ "rstrip": false,
264
+ "single_word": false,
265
+ "special": true
266
+ },
267
+ "52907": {
268
+ "content": "CAR",
269
+ "lstrip": false,
270
+ "normalized": false,
271
+ "rstrip": false,
272
+ "single_word": false,
273
+ "special": true
274
+ },
275
+ "54793": {
276
+ "content": "EOF",
277
+ "lstrip": false,
278
+ "normalized": false,
279
+ "rstrip": false,
280
+ "single_word": false,
281
+ "special": true
282
+ },
283
+ "58530": {
284
+ "content": "PB",
285
+ "lstrip": false,
286
+ "normalized": false,
287
+ "rstrip": false,
288
+ "single_word": false,
289
+ "special": true
290
+ },
291
+ "66773": {
292
+ "content": "DEV",
293
+ "lstrip": false,
294
+ "normalized": false,
295
+ "rstrip": false,
296
+ "single_word": false,
297
+ "special": true
298
+ },
299
+ "68495": {
300
+ "content": "HW",
301
+ "lstrip": false,
302
+ "normalized": false,
303
+ "rstrip": false,
304
+ "single_word": false,
305
+ "special": true
306
+ },
307
+ "70684": {
308
+ "content": "SHA",
309
+ "lstrip": false,
310
+ "normalized": false,
311
+ "rstrip": false,
312
+ "single_word": false,
313
+ "special": true
314
+ },
315
+ "72089": {
316
+ "content": "SKU",
317
+ "lstrip": false,
318
+ "normalized": false,
319
+ "rstrip": false,
320
+ "single_word": false,
321
+ "special": true
322
+ },
323
+ "74923": {
324
+ "content": "CAN",
325
+ "lstrip": false,
326
+ "normalized": false,
327
+ "rstrip": false,
328
+ "single_word": false,
329
+ "special": true
330
+ },
331
+ "77411": {
332
+ "content": "AKE",
333
+ "lstrip": false,
334
+ "normalized": false,
335
+ "rstrip": false,
336
+ "single_word": false,
337
+ "special": true
338
+ },
339
+ "81990": {
340
+ "content": "DEP",
341
+ "lstrip": false,
342
+ "normalized": false,
343
+ "rstrip": false,
344
+ "single_word": false,
345
+ "special": true
346
+ },
347
+ "82244": {
348
+ "content": "GPU",
349
+ "lstrip": false,
350
+ "normalized": false,
351
+ "rstrip": false,
352
+ "single_word": false,
353
+ "special": true
354
+ },
355
+ "84526": {
356
+ "content": "POR",
357
+ "lstrip": false,
358
+ "normalized": false,
359
+ "rstrip": false,
360
+ "single_word": false,
361
+ "special": true
362
+ },
363
+ "86154": {
364
+ "content": "IID",
365
+ "lstrip": false,
366
+ "normalized": false,
367
+ "rstrip": false,
368
+ "single_word": false,
369
+ "special": true
370
+ },
371
+ "86297": {
372
+ "content": "CSI",
373
+ "lstrip": false,
374
+ "normalized": false,
375
+ "rstrip": false,
376
+ "single_word": false,
377
+ "special": true
378
+ },
379
+ "93660": {
380
+ "content": "ACL",
381
+ "lstrip": false,
382
+ "normalized": false,
383
+ "rstrip": false,
384
+ "single_word": false,
385
+ "special": true
386
+ },
387
+ "94432": {
388
+ "content": "TZ",
389
+ "lstrip": false,
390
+ "normalized": false,
391
+ "rstrip": false,
392
+ "single_word": false,
393
+ "special": true
394
+ },
395
+ "95202": {
396
+ "content": "SQ",
397
+ "lstrip": false,
398
+ "normalized": false,
399
+ "rstrip": false,
400
+ "single_word": false,
401
+ "special": true
402
+ },
403
+ "100413": {
404
+ "content": "PSC",
405
+ "lstrip": false,
406
+ "normalized": false,
407
+ "rstrip": false,
408
+ "single_word": false,
409
+ "special": true
410
+ },
411
+ "104755": {
412
+ "content": "DMA",
413
+ "lstrip": false,
414
+ "normalized": false,
415
+ "rstrip": false,
416
+ "single_word": false,
417
+ "special": true
418
+ },
419
+ "104805": {
420
+ "content": "BW",
421
+ "lstrip": false,
422
+ "normalized": false,
423
+ "rstrip": false,
424
+ "single_word": false,
425
+ "special": true
426
+ },
427
+ "106979": {
428
+ "content": "OTP",
429
+ "lstrip": false,
430
+ "normalized": false,
431
+ "rstrip": false,
432
+ "single_word": false,
433
+ "special": true
434
+ },
435
+ "110871": {
436
+ "content": "CRC",
437
+ "lstrip": false,
438
+ "normalized": false,
439
+ "rstrip": false,
440
+ "single_word": false,
441
+ "special": true
442
+ },
443
+ "117565": {
444
+ "content": "FPS",
445
+ "lstrip": false,
446
+ "normalized": false,
447
+ "rstrip": false,
448
+ "single_word": false,
449
+ "special": true
450
+ },
451
+ "118754": {
452
+ "content": "IPC",
453
+ "lstrip": false,
454
+ "normalized": false,
455
+ "rstrip": false,
456
+ "single_word": false,
457
+ "special": true
458
+ },
459
+ "126731": {
460
+ "content": "OEM",
461
+ "lstrip": false,
462
+ "normalized": false,
463
+ "rstrip": false,
464
+ "single_word": false,
465
+ "special": true
466
+ },
467
+ "126978": {
468
+ "content": "AES",
469
+ "lstrip": false,
470
+ "normalized": false,
471
+ "rstrip": false,
472
+ "single_word": false,
473
+ "special": true
474
+ },
475
+ "130911": {
476
+ "content": "RSA",
477
+ "lstrip": false,
478
+ "normalized": false,
479
+ "rstrip": false,
480
+ "single_word": false,
481
+ "special": true
482
+ },
483
+ "147130": {
484
+ "content": "CTR",
485
+ "lstrip": false,
486
+ "normalized": false,
487
+ "rstrip": false,
488
+ "single_word": false,
489
+ "special": true
490
+ },
491
+ "151336": {
492
+ "content": "OSP",
493
+ "lstrip": false,
494
+ "normalized": false,
495
+ "rstrip": false,
496
+ "single_word": false,
497
+ "special": true
498
+ },
499
+ "152076": {
500
+ "content": "IOC",
501
+ "lstrip": false,
502
+ "normalized": false,
503
+ "rstrip": false,
504
+ "single_word": false,
505
+ "special": true
506
+ },
507
+ "152095": {
508
+ "content": "SPA",
509
+ "lstrip": false,
510
+ "normalized": false,
511
+ "rstrip": false,
512
+ "single_word": false,
513
+ "special": true
514
+ },
515
+ "152119": {
516
+ "content": "CDD",
517
+ "lstrip": false,
518
+ "normalized": false,
519
+ "rstrip": false,
520
+ "single_word": false,
521
+ "special": true
522
+ },
523
+ "155474": {
524
+ "content": "SCH",
525
+ "lstrip": false,
526
+ "normalized": false,
527
+ "rstrip": false,
528
+ "single_word": false,
529
+ "special": true
530
+ },
531
+ "158359": {
532
+ "content": "ipc",
533
+ "lstrip": false,
534
+ "normalized": false,
535
+ "rstrip": false,
536
+ "single_word": false,
537
+ "special": true
538
+ },
539
+ "162121": {
540
+ "content": "PLA",
541
+ "lstrip": false,
542
+ "normalized": false,
543
+ "rstrip": false,
544
+ "single_word": false,
545
+ "special": true
546
+ },
547
+ "166996": {
548
+ "content": "CBC",
549
+ "lstrip": false,
550
+ "normalized": false,
551
+ "rstrip": false,
552
+ "single_word": false,
553
+ "special": true
554
+ },
555
+ "171893": {
556
+ "content": "DISPLAY",
557
+ "lstrip": false,
558
+ "normalized": false,
559
+ "rstrip": false,
560
+ "single_word": false,
561
+ "special": true
562
+ },
563
+ "172873": {
564
+ "content": "AAD",
565
+ "lstrip": false,
566
+ "normalized": false,
567
+ "rstrip": false,
568
+ "single_word": false,
569
+ "special": true
570
+ },
571
+ "175772": {
572
+ "content": "TEE",
573
+ "lstrip": false,
574
+ "normalized": false,
575
+ "rstrip": false,
576
+ "single_word": false,
577
+ "special": true
578
+ },
579
+ "177970": {
580
+ "content": "ECB",
581
+ "lstrip": false,
582
+ "normalized": false,
583
+ "rstrip": false,
584
+ "single_word": false,
585
+ "special": true
586
+ },
587
+ "178261": {
588
+ "content": "ECC",
589
+ "lstrip": false,
590
+ "normalized": false,
591
+ "rstrip": false,
592
+ "single_word": false,
593
+ "special": true
594
+ },
595
+ "178974": {
596
+ "content": "PCR",
597
+ "lstrip": false,
598
+ "normalized": false,
599
+ "rstrip": false,
600
+ "single_word": false,
601
+ "special": true
602
+ },
603
+ "186075": {
604
+ "content": "IPI",
605
+ "lstrip": false,
606
+ "normalized": false,
607
+ "rstrip": false,
608
+ "single_word": false,
609
+ "special": true
610
+ },
611
+ "187697": {
612
+ "content": "SSR",
613
+ "lstrip": false,
614
+ "normalized": false,
615
+ "rstrip": false,
616
+ "single_word": false,
617
+ "special": true
618
+ },
619
+ "199998": {
620
+ "content": "<|startoftext|>",
621
+ "lstrip": false,
622
+ "normalized": false,
623
+ "rstrip": false,
624
+ "single_word": false,
625
+ "special": true
626
+ },
627
+ "199999": {
628
+ "content": "<|endoftext|>",
629
+ "lstrip": false,
630
+ "normalized": false,
631
+ "rstrip": false,
632
+ "single_word": false,
633
+ "special": true
634
+ },
635
+ "200000": {
636
+ "content": "<|reserved_200000|>",
637
+ "lstrip": false,
638
+ "normalized": false,
639
+ "rstrip": false,
640
+ "single_word": false,
641
+ "special": true
642
+ },
643
+ "200001": {
644
+ "content": "<|reserved_200001|>",
645
+ "lstrip": false,
646
+ "normalized": false,
647
+ "rstrip": false,
648
+ "single_word": false,
649
+ "special": true
650
+ },
651
+ "200002": {
652
+ "content": "<|return|>",
653
+ "lstrip": false,
654
+ "normalized": false,
655
+ "rstrip": false,
656
+ "single_word": false,
657
+ "special": true
658
+ },
659
+ "200003": {
660
+ "content": "<|constrain|>",
661
+ "lstrip": false,
662
+ "normalized": false,
663
+ "rstrip": false,
664
+ "single_word": false,
665
+ "special": true
666
+ },
667
+ "200004": {
668
+ "content": "<|reserved_200004|>",
669
+ "lstrip": false,
670
+ "normalized": false,
671
+ "rstrip": false,
672
+ "single_word": false,
673
+ "special": true
674
+ },
675
+ "200005": {
676
+ "content": "<|channel|>",
677
+ "lstrip": false,
678
+ "normalized": false,
679
+ "rstrip": false,
680
+ "single_word": false,
681
+ "special": true
682
+ },
683
+ "200006": {
684
+ "content": "<|start|>",
685
+ "lstrip": false,
686
+ "normalized": false,
687
+ "rstrip": false,
688
+ "single_word": false,
689
+ "special": true
690
+ },
691
+ "200007": {
692
+ "content": "<|end|>",
693
+ "lstrip": false,
694
+ "normalized": false,
695
+ "rstrip": false,
696
+ "single_word": false,
697
+ "special": true
698
+ },
699
+ "200008": {
700
+ "content": "<|message|>",
701
+ "lstrip": false,
702
+ "normalized": false,
703
+ "rstrip": false,
704
+ "single_word": false,
705
+ "special": true
706
+ },
707
+ "200009": {
708
+ "content": "<|reserved_200009|>",
709
+ "lstrip": false,
710
+ "normalized": false,
711
+ "rstrip": false,
712
+ "single_word": false,
713
+ "special": true
714
+ },
715
+ "200010": {
716
+ "content": "<|reserved_200010|>",
717
+ "lstrip": false,
718
+ "normalized": false,
719
+ "rstrip": false,
720
+ "single_word": false,
721
+ "special": true
722
+ },
723
+ "200011": {
724
+ "content": "<|reserved_200011|>",
725
+ "lstrip": false,
726
+ "normalized": false,
727
+ "rstrip": false,
728
+ "single_word": false,
729
+ "special": true
730
+ },
731
+ "200012": {
732
+ "content": "<|call|>",
733
+ "lstrip": false,
734
+ "normalized": false,
735
+ "rstrip": false,
736
+ "single_word": false,
737
+ "special": true
738
+ },
739
+ "200013": {
740
+ "content": "<|reserved_200013|>",
741
+ "lstrip": false,
742
+ "normalized": false,
743
+ "rstrip": false,
744
+ "single_word": false,
745
+ "special": true
746
+ },
747
+ "200014": {
748
+ "content": "<|reserved_200014|>",
749
+ "lstrip": false,
750
+ "normalized": false,
751
+ "rstrip": false,
752
+ "single_word": false,
753
+ "special": true
754
+ },
755
+ "200015": {
756
+ "content": "<|reserved_200015|>",
757
+ "lstrip": false,
758
+ "normalized": false,
759
+ "rstrip": false,
760
+ "single_word": false,
761
+ "special": true
762
+ },
763
+ "200016": {
764
+ "content": "<|reserved_200016|>",
765
+ "lstrip": false,
766
+ "normalized": false,
767
+ "rstrip": false,
768
+ "single_word": false,
769
+ "special": true
770
+ },
771
+ "200017": {
772
+ "content": "<|reserved_200017|>",
773
+ "lstrip": false,
774
+ "normalized": false,
775
+ "rstrip": false,
776
+ "single_word": false,
777
+ "special": true
778
+ },
779
+ "200018": {
780
+ "content": "<|endofprompt|>",
781
+ "lstrip": false,
782
+ "normalized": false,
783
+ "rstrip": false,
784
+ "single_word": false,
785
+ "special": true
786
+ },
787
+ "200019": {
788
+ "content": "AArch64",
789
+ "lstrip": false,
790
+ "normalized": false,
791
+ "rstrip": false,
792
+ "single_word": false,
793
+ "special": true
794
+ },
795
+ "200020": {
796
+ "content": "AES256GCM",
797
+ "lstrip": false,
798
+ "normalized": false,
799
+ "rstrip": false,
800
+ "single_word": false,
801
+ "special": true
802
+ },
803
+ "200021": {
804
+ "content": "AESCBC",
805
+ "lstrip": false,
806
+ "normalized": false,
807
+ "rstrip": false,
808
+ "single_word": false,
809
+ "special": true
810
+ },
811
+ "200022": {
812
+ "content": "AON",
813
+ "lstrip": false,
814
+ "normalized": false,
815
+ "rstrip": false,
816
+ "single_word": false,
817
+ "special": true
818
+ },
819
+ "200023": {
820
+ "content": "ASID",
821
+ "lstrip": false,
822
+ "normalized": false,
823
+ "rstrip": false,
824
+ "single_word": false,
825
+ "special": true
826
+ },
827
+ "200024": {
828
+ "content": "AXI",
829
+ "lstrip": false,
830
+ "normalized": false,
831
+ "rstrip": false,
832
+ "single_word": false,
833
+ "special": true
834
+ },
835
+ "200025": {
836
+ "content": "Acronym",
837
+ "lstrip": false,
838
+ "normalized": false,
839
+ "rstrip": false,
840
+ "single_word": false,
841
+ "special": true
842
+ },
843
+ "200026": {
844
+ "content": "AoU",
845
+ "lstrip": false,
846
+ "normalized": false,
847
+ "rstrip": false,
848
+ "single_word": false,
849
+ "special": true
850
+ },
851
+ "200027": {
852
+ "content": "AutoSar",
853
+ "lstrip": false,
854
+ "normalized": false,
855
+ "rstrip": false,
856
+ "single_word": false,
857
+ "special": true
858
+ },
859
+ "200028": {
860
+ "content": "BAM",
861
+ "lstrip": false,
862
+ "normalized": false,
863
+ "rstrip": false,
864
+ "single_word": false,
865
+ "special": true
866
+ },
867
+ "200029": {
868
+ "content": "BCH",
869
+ "lstrip": false,
870
+ "normalized": false,
871
+ "rstrip": false,
872
+ "single_word": false,
873
+ "special": true
874
+ },
875
+ "200030": {
876
+ "content": "BIST",
877
+ "lstrip": false,
878
+ "normalized": false,
879
+ "rstrip": false,
880
+ "single_word": false,
881
+ "special": true
882
+ },
883
+ "200031": {
884
+ "content": "BOM",
885
+ "lstrip": false,
886
+ "normalized": false,
887
+ "rstrip": false,
888
+ "single_word": false,
889
+ "special": true
890
+ },
891
+ "200032": {
892
+ "content": "BPMP",
893
+ "lstrip": false,
894
+ "normalized": false,
895
+ "rstrip": false,
896
+ "single_word": false,
897
+ "special": true
898
+ },
899
+ "200033": {
900
+ "content": "BPS",
901
+ "lstrip": false,
902
+ "normalized": false,
903
+ "rstrip": false,
904
+ "single_word": false,
905
+ "special": true
906
+ },
907
+ "200034": {
908
+ "content": "BPU",
909
+ "lstrip": false,
910
+ "normalized": false,
911
+ "rstrip": false,
912
+ "single_word": false,
913
+ "special": true
914
+ },
915
+ "200035": {
916
+ "content": "BRBCT",
917
+ "lstrip": false,
918
+ "normalized": false,
919
+ "rstrip": false,
920
+ "single_word": false,
921
+ "special": true
922
+ },
923
+ "200036": {
924
+ "content": "C2C",
925
+ "lstrip": false,
926
+ "normalized": false,
927
+ "rstrip": false,
928
+ "single_word": false,
929
+ "special": true
930
+ },
931
+ "200037": {
932
+ "content": "CANFD",
933
+ "lstrip": false,
934
+ "normalized": false,
935
+ "rstrip": false,
936
+ "single_word": false,
937
+ "special": true
938
+ },
939
+ "200038": {
940
+ "content": "CAVP",
941
+ "lstrip": false,
942
+ "normalized": false,
943
+ "rstrip": false,
944
+ "single_word": false,
945
+ "special": true
946
+ },
947
+ "200039": {
948
+ "content": "CBB",
949
+ "lstrip": false,
950
+ "normalized": false,
951
+ "rstrip": false,
952
+ "single_word": false,
953
+ "special": true
954
+ },
955
+ "200040": {
956
+ "content": "CBR",
957
+ "lstrip": false,
958
+ "normalized": false,
959
+ "rstrip": false,
960
+ "single_word": false,
961
+ "special": true
962
+ },
963
+ "200041": {
964
+ "content": "CCM",
965
+ "lstrip": false,
966
+ "normalized": false,
967
+ "rstrip": false,
968
+ "single_word": false,
969
+ "special": true
970
+ },
971
+ "200042": {
972
+ "content": "CCPLEX",
973
+ "lstrip": false,
974
+ "normalized": false,
975
+ "rstrip": false,
976
+ "single_word": false,
977
+ "special": true
978
+ },
979
+ "200043": {
980
+ "content": "CCPLEX_L2",
981
+ "lstrip": false,
982
+ "normalized": false,
983
+ "rstrip": false,
984
+ "single_word": false,
985
+ "special": true
986
+ },
987
+ "200044": {
988
+ "content": "CCPLEX_MISC",
989
+ "lstrip": false,
990
+ "normalized": false,
991
+ "rstrip": false,
992
+ "single_word": false,
993
+ "special": true
994
+ },
995
+ "200045": {
996
+ "content": "CCPLEX_SCF",
997
+ "lstrip": false,
998
+ "normalized": false,
999
+ "rstrip": false,
1000
+ "single_word": false,
1001
+ "special": true
1002
+ },
1003
+ "200046": {
1004
+ "content": "CIF",
1005
+ "lstrip": false,
1006
+ "normalized": false,
1007
+ "rstrip": false,
1008
+ "single_word": false,
1009
+ "special": true
1010
+ },
1011
+ "200047": {
1012
+ "content": "CMAC",
1013
+ "lstrip": false,
1014
+ "normalized": false,
1015
+ "rstrip": false,
1016
+ "single_word": false,
1017
+ "special": true
1018
+ },
1019
+ "200048": {
1020
+ "content": "CPE",
1021
+ "lstrip": false,
1022
+ "normalized": false,
1023
+ "rstrip": false,
1024
+ "single_word": false,
1025
+ "special": true
1026
+ },
1027
+ "200049": {
1028
+ "content": "CSP",
1029
+ "lstrip": false,
1030
+ "normalized": false,
1031
+ "rstrip": false,
1032
+ "single_word": false,
1033
+ "special": true
1034
+ },
1035
+ "200050": {
1036
+ "content": "CTXT",
1037
+ "lstrip": false,
1038
+ "normalized": false,
1039
+ "rstrip": false,
1040
+ "single_word": false,
1041
+ "special": true
1042
+ },
1043
+ "200051": {
1044
+ "content": "DBB",
1045
+ "lstrip": false,
1046
+ "normalized": false,
1047
+ "rstrip": false,
1048
+ "single_word": false,
1049
+ "special": true
1050
+ },
1051
+ "200052": {
1052
+ "content": "DFA",
1053
+ "lstrip": false,
1054
+ "normalized": false,
1055
+ "rstrip": false,
1056
+ "single_word": false,
1057
+ "special": true
1058
+ },
1059
+ "200053": {
1060
+ "content": "DFT",
1061
+ "lstrip": false,
1062
+ "normalized": false,
1063
+ "rstrip": false,
1064
+ "single_word": false,
1065
+ "special": true
1066
+ },
1067
+ "200054": {
1068
+ "content": "DIP",
1069
+ "lstrip": false,
1070
+ "normalized": false,
1071
+ "rstrip": false,
1072
+ "single_word": false,
1073
+ "special": true
1074
+ },
1075
+ "200055": {
1076
+ "content": "DLA",
1077
+ "lstrip": false,
1078
+ "normalized": false,
1079
+ "rstrip": false,
1080
+ "single_word": false,
1081
+ "special": true
1082
+ },
1083
+ "200056": {
1084
+ "content": "DMEM",
1085
+ "lstrip": false,
1086
+ "normalized": false,
1087
+ "rstrip": false,
1088
+ "single_word": false,
1089
+ "special": true
1090
+ },
1091
+ "200057": {
1092
+ "content": "DPA",
1093
+ "lstrip": false,
1094
+ "normalized": false,
1095
+ "rstrip": false,
1096
+ "single_word": false,
1097
+ "special": true
1098
+ },
1099
+ "200058": {
1100
+ "content": "DSC",
1101
+ "lstrip": false,
1102
+ "normalized": false,
1103
+ "rstrip": false,
1104
+ "single_word": false,
1105
+ "special": true
1106
+ },
1107
+ "200059": {
1108
+ "content": "DVMU",
1109
+ "lstrip": false,
1110
+ "normalized": false,
1111
+ "rstrip": false,
1112
+ "single_word": false,
1113
+ "special": true
1114
+ },
1115
+ "200060": {
1116
+ "content": "ECDHE",
1117
+ "lstrip": false,
1118
+ "normalized": false,
1119
+ "rstrip": false,
1120
+ "single_word": false,
1121
+ "special": true
1122
+ },
1123
+ "200061": {
1124
+ "content": "ECDSA",
1125
+ "lstrip": false,
1126
+ "normalized": false,
1127
+ "rstrip": false,
1128
+ "single_word": false,
1129
+ "special": true
1130
+ },
1131
+ "200062": {
1132
+ "content": "ECID",
1133
+ "lstrip": false,
1134
+ "normalized": false,
1135
+ "rstrip": false,
1136
+ "single_word": false,
1137
+ "special": true
1138
+ },
1139
+ "200063": {
1140
+ "content": "EDR",
1141
+ "lstrip": false,
1142
+ "normalized": false,
1143
+ "rstrip": false,
1144
+ "single_word": false,
1145
+ "special": true
1146
+ },
1147
+ "200064": {
1148
+ "content": "EOTTI",
1149
+ "lstrip": false,
1150
+ "normalized": false,
1151
+ "rstrip": false,
1152
+ "single_word": false,
1153
+ "special": true
1154
+ },
1155
+ "200065": {
1156
+ "content": "EQoS",
1157
+ "lstrip": false,
1158
+ "normalized": false,
1159
+ "rstrip": false,
1160
+ "single_word": false,
1161
+ "special": true
1162
+ },
1163
+ "200066": {
1164
+ "content": "FCL",
1165
+ "lstrip": false,
1166
+ "normalized": false,
1167
+ "rstrip": false,
1168
+ "single_word": false,
1169
+ "special": true
1170
+ },
1171
+ "200067": {
1172
+ "content": "FHTI",
1173
+ "lstrip": false,
1174
+ "normalized": false,
1175
+ "rstrip": false,
1176
+ "single_word": false,
1177
+ "special": true
1178
+ },
1179
+ "200068": {
1180
+ "content": "FIPS",
1181
+ "lstrip": false,
1182
+ "normalized": false,
1183
+ "rstrip": false,
1184
+ "single_word": false,
1185
+ "special": true
1186
+ },
1187
+ "200069": {
1188
+ "content": "FMEA",
1189
+ "lstrip": false,
1190
+ "normalized": false,
1191
+ "rstrip": false,
1192
+ "single_word": false,
1193
+ "special": true
1194
+ },
1195
+ "200070": {
1196
+ "content": "FMON",
1197
+ "lstrip": false,
1198
+ "normalized": false,
1199
+ "rstrip": false,
1200
+ "single_word": false,
1201
+ "special": true
1202
+ },
1203
+ "200071": {
1204
+ "content": "FuSa",
1205
+ "lstrip": false,
1206
+ "normalized": false,
1207
+ "rstrip": false,
1208
+ "single_word": false,
1209
+ "special": true
1210
+ },
1211
+ "200072": {
1212
+ "content": "GCM",
1213
+ "lstrip": false,
1214
+ "normalized": false,
1215
+ "rstrip": false,
1216
+ "single_word": false,
1217
+ "special": true
1218
+ },
1219
+ "200073": {
1220
+ "content": "GFD",
1221
+ "lstrip": false,
1222
+ "normalized": false,
1223
+ "rstrip": false,
1224
+ "single_word": false,
1225
+ "special": true
1226
+ },
1227
+ "200074": {
1228
+ "content": "GIC",
1229
+ "lstrip": false,
1230
+ "normalized": false,
1231
+ "rstrip": false,
1232
+ "single_word": false,
1233
+ "special": true
1234
+ },
1235
+ "200075": {
1236
+ "content": "GMAC",
1237
+ "lstrip": false,
1238
+ "normalized": false,
1239
+ "rstrip": false,
1240
+ "single_word": false,
1241
+ "special": true
1242
+ },
1243
+ "200076": {
1244
+ "content": "GMSL",
1245
+ "lstrip": false,
1246
+ "normalized": false,
1247
+ "rstrip": false,
1248
+ "single_word": false,
1249
+ "special": true
1250
+ },
1251
+ "200077": {
1252
+ "content": "GOP",
1253
+ "lstrip": false,
1254
+ "normalized": false,
1255
+ "rstrip": false,
1256
+ "single_word": false,
1257
+ "special": true
1258
+ },
1259
+ "200078": {
1260
+ "content": "GPCDMA",
1261
+ "lstrip": false,
1262
+ "normalized": false,
1263
+ "rstrip": false,
1264
+ "single_word": false,
1265
+ "special": true
1266
+ },
1267
+ "200079": {
1268
+ "content": "Gpps",
1269
+ "lstrip": false,
1270
+ "normalized": false,
1271
+ "rstrip": false,
1272
+ "single_word": false,
1273
+ "special": true
1274
+ },
1275
+ "200080": {
1276
+ "content": "HBR",
1277
+ "lstrip": false,
1278
+ "normalized": false,
1279
+ "rstrip": false,
1280
+ "single_word": false,
1281
+ "special": true
1282
+ },
1283
+ "200081": {
1284
+ "content": "HBR2",
1285
+ "lstrip": false,
1286
+ "normalized": false,
1287
+ "rstrip": false,
1288
+ "single_word": false,
1289
+ "special": true
1290
+ },
1291
+ "200082": {
1292
+ "content": "HBR3",
1293
+ "lstrip": false,
1294
+ "normalized": false,
1295
+ "rstrip": false,
1296
+ "single_word": false,
1297
+ "special": true
1298
+ },
1299
+ "200083": {
1300
+ "content": "HDS",
1301
+ "lstrip": false,
1302
+ "normalized": false,
1303
+ "rstrip": false,
1304
+ "single_word": false,
1305
+ "special": true
1306
+ },
1307
+ "200084": {
1308
+ "content": "HIS",
1309
+ "lstrip": false,
1310
+ "normalized": false,
1311
+ "rstrip": false,
1312
+ "single_word": false,
1313
+ "special": true
1314
+ },
1315
+ "200085": {
1316
+ "content": "HMAC",
1317
+ "lstrip": false,
1318
+ "normalized": false,
1319
+ "rstrip": false,
1320
+ "single_word": false,
1321
+ "special": true
1322
+ },
1323
+ "200086": {
1324
+ "content": "HPSE",
1325
+ "lstrip": false,
1326
+ "normalized": false,
1327
+ "rstrip": false,
1328
+ "single_word": false,
1329
+ "special": true
1330
+ },
1331
+ "200087": {
1332
+ "content": "HSI",
1333
+ "lstrip": false,
1334
+ "normalized": false,
1335
+ "rstrip": false,
1336
+ "single_word": false,
1337
+ "special": true
1338
+ },
1339
+ "200088": {
1340
+ "content": "HSM",
1341
+ "lstrip": false,
1342
+ "normalized": false,
1343
+ "rstrip": false,
1344
+ "single_word": false,
1345
+ "special": true
1346
+ },
1347
+ "200089": {
1348
+ "content": "HSP",
1349
+ "lstrip": false,
1350
+ "normalized": false,
1351
+ "rstrip": false,
1352
+ "single_word": false,
1353
+ "special": true
1354
+ },
1355
+ "200090": {
1356
+ "content": "ICD",
1357
+ "lstrip": false,
1358
+ "normalized": false,
1359
+ "rstrip": false,
1360
+ "single_word": false,
1361
+ "special": true
1362
+ },
1363
+ "200091": {
1364
+ "content": "IDR",
1365
+ "lstrip": false,
1366
+ "normalized": false,
1367
+ "rstrip": false,
1368
+ "single_word": false,
1369
+ "special": true
1370
+ },
1371
+ "200092": {
1372
+ "content": "IDT",
1373
+ "lstrip": false,
1374
+ "normalized": false,
1375
+ "rstrip": false,
1376
+ "single_word": false,
1377
+ "special": true
1378
+ },
1379
+ "200093": {
1380
+ "content": "IEP",
1381
+ "lstrip": false,
1382
+ "normalized": false,
1383
+ "rstrip": false,
1384
+ "single_word": false,
1385
+ "special": true
1386
+ },
1387
+ "200094": {
1388
+ "content": "IEU",
1389
+ "lstrip": false,
1390
+ "normalized": false,
1391
+ "rstrip": false,
1392
+ "single_word": false,
1393
+ "special": true
1394
+ },
1395
+ "200095": {
1396
+ "content": "IFU",
1397
+ "lstrip": false,
1398
+ "normalized": false,
1399
+ "rstrip": false,
1400
+ "single_word": false,
1401
+ "special": true
1402
+ },
1403
+ "200096": {
1404
+ "content": "IMEM",
1405
+ "lstrip": false,
1406
+ "normalized": false,
1407
+ "rstrip": false,
1408
+ "single_word": false,
1409
+ "special": true
1410
+ },
1411
+ "200097": {
1412
+ "content": "IOFA",
1413
+ "lstrip": false,
1414
+ "normalized": false,
1415
+ "rstrip": false,
1416
+ "single_word": false,
1417
+ "special": true
1418
+ },
1419
+ "200098": {
1420
+ "content": "IOMMU",
1421
+ "lstrip": false,
1422
+ "normalized": false,
1423
+ "rstrip": false,
1424
+ "single_word": false,
1425
+ "special": true
1426
+ },
1427
+ "200099": {
1428
+ "content": "IRF",
1429
+ "lstrip": false,
1430
+ "normalized": false,
1431
+ "rstrip": false,
1432
+ "single_word": false,
1433
+ "special": true
1434
+ },
1435
+ "200100": {
1436
+ "content": "IoT",
1437
+ "lstrip": false,
1438
+ "normalized": false,
1439
+ "rstrip": false,
1440
+ "single_word": false,
1441
+ "special": true
1442
+ },
1443
+ "200101": {
1444
+ "content": "JSR",
1445
+ "lstrip": false,
1446
+ "normalized": false,
1447
+ "rstrip": false,
1448
+ "single_word": false,
1449
+ "special": true
1450
+ },
1451
+ "200102": {
1452
+ "content": "KAT",
1453
+ "lstrip": false,
1454
+ "normalized": false,
1455
+ "rstrip": false,
1456
+ "single_word": false,
1457
+ "special": true
1458
+ },
1459
+ "200103": {
1460
+ "content": "KCV",
1461
+ "lstrip": false,
1462
+ "normalized": false,
1463
+ "rstrip": false,
1464
+ "single_word": false,
1465
+ "special": true
1466
+ },
1467
+ "200104": {
1468
+ "content": "KDF",
1469
+ "lstrip": false,
1470
+ "normalized": false,
1471
+ "rstrip": false,
1472
+ "single_word": false,
1473
+ "special": true
1474
+ },
1475
+ "200105": {
1476
+ "content": "KPI",
1477
+ "lstrip": false,
1478
+ "normalized": false,
1479
+ "rstrip": false,
1480
+ "single_word": false,
1481
+ "special": true
1482
+ },
1483
+ "200106": {
1484
+ "content": "L1PT",
1485
+ "lstrip": false,
1486
+ "normalized": false,
1487
+ "rstrip": false,
1488
+ "single_word": false,
1489
+ "special": true
1490
+ },
1491
+ "200107": {
1492
+ "content": "L2C",
1493
+ "lstrip": false,
1494
+ "normalized": false,
1495
+ "rstrip": false,
1496
+ "single_word": false,
1497
+ "special": true
1498
+ },
1499
+ "200108": {
1500
+ "content": "L2mDIR",
1501
+ "lstrip": false,
1502
+ "normalized": false,
1503
+ "rstrip": false,
1504
+ "single_word": false,
1505
+ "special": true
1506
+ },
1507
+ "200109": {
1508
+ "content": "L2vDIR",
1509
+ "lstrip": false,
1510
+ "normalized": false,
1511
+ "rstrip": false,
1512
+ "single_word": false,
1513
+ "special": true
1514
+ },
1515
+ "200110": {
1516
+ "content": "LBIST",
1517
+ "lstrip": false,
1518
+ "normalized": false,
1519
+ "rstrip": false,
1520
+ "single_word": false,
1521
+ "special": true
1522
+ },
1523
+ "200111": {
1524
+ "content": "LDC",
1525
+ "lstrip": false,
1526
+ "normalized": false,
1527
+ "rstrip": false,
1528
+ "single_word": false,
1529
+ "special": true
1530
+ },
1531
+ "200112": {
1532
+ "content": "LFT",
1533
+ "lstrip": false,
1534
+ "normalized": false,
1535
+ "rstrip": false,
1536
+ "single_word": false,
1537
+ "special": true
1538
+ },
1539
+ "200113": {
1540
+ "content": "LIP",
1541
+ "lstrip": false,
1542
+ "normalized": false,
1543
+ "rstrip": false,
1544
+ "single_word": false,
1545
+ "special": true
1546
+ },
1547
+ "200114": {
1548
+ "content": "LSB",
1549
+ "lstrip": false,
1550
+ "normalized": false,
1551
+ "rstrip": false,
1552
+ "single_word": false,
1553
+ "special": true
1554
+ },
1555
+ "200115": {
1556
+ "content": "MAQ",
1557
+ "lstrip": false,
1558
+ "normalized": false,
1559
+ "rstrip": false,
1560
+ "single_word": false,
1561
+ "special": true
1562
+ },
1563
+ "200116": {
1564
+ "content": "MBIST",
1565
+ "lstrip": false,
1566
+ "normalized": false,
1567
+ "rstrip": false,
1568
+ "single_word": false,
1569
+ "special": true
1570
+ },
1571
+ "200117": {
1572
+ "content": "MCAL",
1573
+ "lstrip": false,
1574
+ "normalized": false,
1575
+ "rstrip": false,
1576
+ "single_word": false,
1577
+ "special": true
1578
+ },
1579
+ "200118": {
1580
+ "content": "MCE",
1581
+ "lstrip": false,
1582
+ "normalized": false,
1583
+ "rstrip": false,
1584
+ "single_word": false,
1585
+ "special": true
1586
+ },
1587
+ "200119": {
1588
+ "content": "MCU",
1589
+ "lstrip": false,
1590
+ "normalized": false,
1591
+ "rstrip": false,
1592
+ "single_word": false,
1593
+ "special": true
1594
+ },
1595
+ "200120": {
1596
+ "content": "MSB",
1597
+ "lstrip": false,
1598
+ "normalized": false,
1599
+ "rstrip": false,
1600
+ "single_word": false,
1601
+ "special": true
1602
+ },
1603
+ "200121": {
1604
+ "content": "MSS",
1605
+ "lstrip": false,
1606
+ "normalized": false,
1607
+ "rstrip": false,
1608
+ "single_word": false,
1609
+ "special": true
1610
+ },
1611
+ "200122": {
1612
+ "content": "MST",
1613
+ "lstrip": false,
1614
+ "normalized": false,
1615
+ "rstrip": false,
1616
+ "single_word": false,
1617
+ "special": true
1618
+ },
1619
+ "200123": {
1620
+ "content": "MTS",
1621
+ "lstrip": false,
1622
+ "normalized": false,
1623
+ "rstrip": false,
1624
+ "single_word": false,
1625
+ "special": true
1626
+ },
1627
+ "200124": {
1628
+ "content": "MiTM",
1629
+ "lstrip": false,
1630
+ "normalized": false,
1631
+ "rstrip": false,
1632
+ "single_word": false,
1633
+ "special": true
1634
+ },
1635
+ "200125": {
1636
+ "content": "NIP",
1637
+ "lstrip": false,
1638
+ "normalized": false,
1639
+ "rstrip": false,
1640
+ "single_word": false,
1641
+ "special": true
1642
+ },
1643
+ "200126": {
1644
+ "content": "NIST",
1645
+ "lstrip": false,
1646
+ "normalized": false,
1647
+ "rstrip": false,
1648
+ "single_word": false,
1649
+ "special": true
1650
+ },
1651
+ "200127": {
1652
+ "content": "NITO",
1653
+ "lstrip": false,
1654
+ "normalized": false,
1655
+ "rstrip": false,
1656
+ "single_word": false,
1657
+ "special": true
1658
+ },
1659
+ "200128": {
1660
+ "content": "NOC",
1661
+ "lstrip": false,
1662
+ "normalized": false,
1663
+ "rstrip": false,
1664
+ "single_word": false,
1665
+ "special": true
1666
+ },
1667
+ "200129": {
1668
+ "content": "NOOP",
1669
+ "lstrip": false,
1670
+ "normalized": false,
1671
+ "rstrip": false,
1672
+ "single_word": false,
1673
+ "special": true
1674
+ },
1675
+ "200130": {
1676
+ "content": "NVDEC",
1677
+ "lstrip": false,
1678
+ "normalized": false,
1679
+ "rstrip": false,
1680
+ "single_word": false,
1681
+ "special": true
1682
+ },
1683
+ "200131": {
1684
+ "content": "NVENC",
1685
+ "lstrip": false,
1686
+ "normalized": false,
1687
+ "rstrip": false,
1688
+ "single_word": false,
1689
+ "special": true
1690
+ },
1691
+ "200132": {
1692
+ "content": "NVJPG",
1693
+ "lstrip": false,
1694
+ "normalized": false,
1695
+ "rstrip": false,
1696
+ "single_word": false,
1697
+ "special": true
1698
+ },
1699
+ "200133": {
1700
+ "content": "NVM",
1701
+ "lstrip": false,
1702
+ "normalized": false,
1703
+ "rstrip": false,
1704
+ "single_word": false,
1705
+ "special": true
1706
+ },
1707
+ "200134": {
1708
+ "content": "NVVSE",
1709
+ "lstrip": false,
1710
+ "normalized": false,
1711
+ "rstrip": false,
1712
+ "single_word": false,
1713
+ "special": true
1714
+ },
1715
+ "200135": {
1716
+ "content": "OFA",
1717
+ "lstrip": false,
1718
+ "normalized": false,
1719
+ "rstrip": false,
1720
+ "single_word": false,
1721
+ "special": true
1722
+ },
1723
+ "200136": {
1724
+ "content": "PCIE",
1725
+ "lstrip": false,
1726
+ "normalized": false,
1727
+ "rstrip": false,
1728
+ "single_word": false,
1729
+ "special": true
1730
+ },
1731
+ "200137": {
1732
+ "content": "PCPU",
1733
+ "lstrip": false,
1734
+ "normalized": false,
1735
+ "rstrip": false,
1736
+ "single_word": false,
1737
+ "special": true
1738
+ },
1739
+ "200138": {
1740
+ "content": "PCT",
1741
+ "lstrip": false,
1742
+ "normalized": false,
1743
+ "rstrip": false,
1744
+ "single_word": false,
1745
+ "special": true
1746
+ },
1747
+ "200139": {
1748
+ "content": "PDK",
1749
+ "lstrip": false,
1750
+ "normalized": false,
1751
+ "rstrip": false,
1752
+ "single_word": false,
1753
+ "special": true
1754
+ },
1755
+ "200140": {
1756
+ "content": "PII",
1757
+ "lstrip": false,
1758
+ "normalized": false,
1759
+ "rstrip": false,
1760
+ "single_word": false,
1761
+ "special": true
1762
+ },
1763
+ "200141": {
1764
+ "content": "PIP",
1765
+ "lstrip": false,
1766
+ "normalized": false,
1767
+ "rstrip": false,
1768
+ "single_word": false,
1769
+ "special": true
1770
+ },
1771
+ "200142": {
1772
+ "content": "PKC",
1773
+ "lstrip": false,
1774
+ "normalized": false,
1775
+ "rstrip": false,
1776
+ "single_word": false,
1777
+ "special": true
1778
+ },
1779
+ "200143": {
1780
+ "content": "PKCS",
1781
+ "lstrip": false,
1782
+ "normalized": false,
1783
+ "rstrip": false,
1784
+ "single_word": false,
1785
+ "special": true
1786
+ },
1787
+ "200144": {
1788
+ "content": "PKI",
1789
+ "lstrip": false,
1790
+ "normalized": false,
1791
+ "rstrip": false,
1792
+ "single_word": false,
1793
+ "special": true
1794
+ },
1795
+ "200145": {
1796
+ "content": "PPC",
1797
+ "lstrip": false,
1798
+ "normalized": false,
1799
+ "rstrip": false,
1800
+ "single_word": false,
1801
+ "special": true
1802
+ },
1803
+ "200146": {
1804
+ "content": "PTXT",
1805
+ "lstrip": false,
1806
+ "normalized": false,
1807
+ "rstrip": false,
1808
+ "single_word": false,
1809
+ "special": true
1810
+ },
1811
+ "200147": {
1812
+ "content": "PVA",
1813
+ "lstrip": false,
1814
+ "normalized": false,
1815
+ "rstrip": false,
1816
+ "single_word": false,
1817
+ "special": true
1818
+ },
1819
+ "200148": {
1820
+ "content": "QNX",
1821
+ "lstrip": false,
1822
+ "normalized": false,
1823
+ "rstrip": false,
1824
+ "single_word": false,
1825
+ "special": true
1826
+ },
1827
+ "200149": {
1828
+ "content": "QOS",
1829
+ "lstrip": false,
1830
+ "normalized": false,
1831
+ "rstrip": false,
1832
+ "single_word": false,
1833
+ "special": true
1834
+ },
1835
+ "200150": {
1836
+ "content": "QSPI",
1837
+ "lstrip": false,
1838
+ "normalized": false,
1839
+ "rstrip": false,
1840
+ "single_word": false,
1841
+ "special": true
1842
+ },
1843
+ "200151": {
1844
+ "content": "RBG",
1845
+ "lstrip": false,
1846
+ "normalized": false,
1847
+ "rstrip": false,
1848
+ "single_word": false,
1849
+ "special": true
1850
+ },
1851
+ "200152": {
1852
+ "content": "RBR",
1853
+ "lstrip": false,
1854
+ "normalized": false,
1855
+ "rstrip": false,
1856
+ "single_word": false,
1857
+ "special": true
1858
+ },
1859
+ "200153": {
1860
+ "content": "RDEV",
1861
+ "lstrip": false,
1862
+ "normalized": false,
1863
+ "rstrip": false,
1864
+ "single_word": false,
1865
+ "special": true
1866
+ },
1867
+ "200154": {
1868
+ "content": "RMA",
1869
+ "lstrip": false,
1870
+ "normalized": false,
1871
+ "rstrip": false,
1872
+ "single_word": false,
1873
+ "special": true
1874
+ },
1875
+ "200155": {
1876
+ "content": "RMW",
1877
+ "lstrip": false,
1878
+ "normalized": false,
1879
+ "rstrip": false,
1880
+ "single_word": false,
1881
+ "special": true
1882
+ },
1883
+ "200156": {
1884
+ "content": "RSB",
1885
+ "lstrip": false,
1886
+ "normalized": false,
1887
+ "rstrip": false,
1888
+ "single_word": false,
1889
+ "special": true
1890
+ },
1891
+ "200157": {
1892
+ "content": "RTS",
1893
+ "lstrip": false,
1894
+ "normalized": false,
1895
+ "rstrip": false,
1896
+ "single_word": false,
1897
+ "special": true
1898
+ },
1899
+ "200158": {
1900
+ "content": "RoT",
1901
+ "lstrip": false,
1902
+ "normalized": false,
1903
+ "rstrip": false,
1904
+ "single_word": false,
1905
+ "special": true
1906
+ },
1907
+ "200159": {
1908
+ "content": "SAE",
1909
+ "lstrip": false,
1910
+ "normalized": false,
1911
+ "rstrip": false,
1912
+ "single_word": false,
1913
+ "special": true
1914
+ },
1915
+ "200160": {
1916
+ "content": "SBK",
1917
+ "lstrip": false,
1918
+ "normalized": false,
1919
+ "rstrip": false,
1920
+ "single_word": false,
1921
+ "special": true
1922
+ },
1923
+ "200161": {
1924
+ "content": "SEL0",
1925
+ "lstrip": false,
1926
+ "normalized": false,
1927
+ "rstrip": false,
1928
+ "single_word": false,
1929
+ "special": true
1930
+ },
1931
+ "200162": {
1932
+ "content": "SEL1",
1933
+ "lstrip": false,
1934
+ "normalized": false,
1935
+ "rstrip": false,
1936
+ "single_word": false,
1937
+ "special": true
1938
+ },
1939
+ "200163": {
1940
+ "content": "SEooC",
1941
+ "lstrip": false,
1942
+ "normalized": false,
1943
+ "rstrip": false,
1944
+ "single_word": false,
1945
+ "special": true
1946
+ },
1947
+ "200164": {
1948
+ "content": "SGM",
1949
+ "lstrip": false,
1950
+ "normalized": false,
1951
+ "rstrip": false,
1952
+ "single_word": false,
1953
+ "special": true
1954
+ },
1955
+ "200165": {
1956
+ "content": "SHA256",
1957
+ "lstrip": false,
1958
+ "normalized": false,
1959
+ "rstrip": false,
1960
+ "single_word": false,
1961
+ "special": true
1962
+ },
1963
+ "200166": {
1964
+ "content": "SHA512",
1965
+ "lstrip": false,
1966
+ "normalized": false,
1967
+ "rstrip": false,
1968
+ "single_word": false,
1969
+ "special": true
1970
+ },
1971
+ "200167": {
1972
+ "content": "SHE",
1973
+ "lstrip": false,
1974
+ "normalized": false,
1975
+ "rstrip": false,
1976
+ "single_word": false,
1977
+ "special": true
1978
+ },
1979
+ "200168": {
1980
+ "content": "SNOC",
1981
+ "lstrip": false,
1982
+ "normalized": false,
1983
+ "rstrip": false,
1984
+ "single_word": false,
1985
+ "special": true
1986
+ },
1987
+ "200169": {
1988
+ "content": "SST",
1989
+ "lstrip": false,
1990
+ "normalized": false,
1991
+ "rstrip": false,
1992
+ "single_word": false,
1993
+ "special": true
1994
+ },
1995
+ "200170": {
1996
+ "content": "SWAT",
1997
+ "lstrip": false,
1998
+ "normalized": false,
1999
+ "rstrip": false,
2000
+ "single_word": false,
2001
+ "special": true
2002
+ },
2003
+ "200171": {
2004
+ "content": "SoC",
2005
+ "lstrip": false,
2006
+ "normalized": false,
2007
+ "rstrip": false,
2008
+ "single_word": false,
2009
+ "special": true
2010
+ },
2011
+ "200172": {
2012
+ "content": "TCF",
2013
+ "lstrip": false,
2014
+ "normalized": false,
2015
+ "rstrip": false,
2016
+ "single_word": false,
2017
+ "special": true
2018
+ },
2019
+ "200173": {
2020
+ "content": "THI",
2021
+ "lstrip": false,
2022
+ "normalized": false,
2023
+ "rstrip": false,
2024
+ "single_word": false,
2025
+ "special": true
2026
+ },
2027
+ "200174": {
2028
+ "content": "TNR",
2029
+ "lstrip": false,
2030
+ "normalized": false,
2031
+ "rstrip": false,
2032
+ "single_word": false,
2033
+ "special": true
2034
+ },
2035
+ "200175": {
2036
+ "content": "TOS",
2037
+ "lstrip": false,
2038
+ "normalized": false,
2039
+ "rstrip": false,
2040
+ "single_word": false,
2041
+ "special": true
2042
+ },
2043
+ "200176": {
2044
+ "content": "TRC",
2045
+ "lstrip": false,
2046
+ "normalized": false,
2047
+ "rstrip": false,
2048
+ "single_word": false,
2049
+ "special": true
2050
+ },
2051
+ "200177": {
2052
+ "content": "TSEC",
2053
+ "lstrip": false,
2054
+ "normalized": false,
2055
+ "rstrip": false,
2056
+ "single_word": false,
2057
+ "special": true
2058
+ },
2059
+ "200178": {
2060
+ "content": "UFS",
2061
+ "lstrip": false,
2062
+ "normalized": false,
2063
+ "rstrip": false,
2064
+ "single_word": false,
2065
+ "special": true
2066
+ },
2067
+ "200179": {
2068
+ "content": "VBR",
2069
+ "lstrip": false,
2070
+ "normalized": false,
2071
+ "rstrip": false,
2072
+ "single_word": false,
2073
+ "special": true
2074
+ },
2075
+ "200180": {
2076
+ "content": "VCPU",
2077
+ "lstrip": false,
2078
+ "normalized": false,
2079
+ "rstrip": false,
2080
+ "single_word": false,
2081
+ "special": true
2082
+ },
2083
+ "200181": {
2084
+ "content": "VIC",
2085
+ "lstrip": false,
2086
+ "normalized": false,
2087
+ "rstrip": false,
2088
+ "single_word": false,
2089
+ "special": true
2090
+ },
2091
+ "200182": {
2092
+ "content": "VMEM",
2093
+ "lstrip": false,
2094
+ "normalized": false,
2095
+ "rstrip": false,
2096
+ "single_word": false,
2097
+ "special": true
2098
+ },
2099
+ "200183": {
2100
+ "content": "VMID",
2101
+ "lstrip": false,
2102
+ "normalized": false,
2103
+ "rstrip": false,
2104
+ "single_word": false,
2105
+ "special": true
2106
+ },
2107
+ "200184": {
2108
+ "content": "VPU",
2109
+ "lstrip": false,
2110
+ "normalized": false,
2111
+ "rstrip": false,
2112
+ "single_word": false,
2113
+ "special": true
2114
+ },
2115
+ "200185": {
2116
+ "content": "VRC",
2117
+ "lstrip": false,
2118
+ "normalized": false,
2119
+ "rstrip": false,
2120
+ "single_word": false,
2121
+ "special": true
2122
+ },
2123
+ "200186": {
2124
+ "content": "VUI",
2125
+ "lstrip": false,
2126
+ "normalized": false,
2127
+ "rstrip": false,
2128
+ "single_word": false,
2129
+ "special": true
2130
+ },
2131
+ "200187": {
2132
+ "content": "WARB",
2133
+ "lstrip": false,
2134
+ "normalized": false,
2135
+ "rstrip": false,
2136
+ "single_word": false,
2137
+ "special": true
2138
+ },
2139
+ "200188": {
2140
+ "content": "XIP",
2141
+ "lstrip": false,
2142
+ "normalized": false,
2143
+ "rstrip": false,
2144
+ "single_word": false,
2145
+ "special": true
2146
+ },
2147
+ "200189": {
2148
+ "content": "bpp",
2149
+ "lstrip": false,
2150
+ "normalized": false,
2151
+ "rstrip": false,
2152
+ "single_word": false,
2153
+ "special": true
2154
+ },
2155
+ "200190": {
2156
+ "content": "eMMC",
2157
+ "lstrip": false,
2158
+ "normalized": false,
2159
+ "rstrip": false,
2160
+ "single_word": false,
2161
+ "special": true
2162
+ },
2163
+ "200191": {
2164
+ "content": "hfPLA",
2165
+ "lstrip": false,
2166
+ "normalized": false,
2167
+ "rstrip": false,
2168
+ "single_word": false,
2169
+ "special": true
2170
+ },
2171
+ "200192": {
2172
+ "content": "iGPU",
2173
+ "lstrip": false,
2174
+ "normalized": false,
2175
+ "rstrip": false,
2176
+ "single_word": false,
2177
+ "special": true
2178
+ },
2179
+ "200193": {
2180
+ "content": "ipc_fg",
2181
+ "lstrip": false,
2182
+ "normalized": false,
2183
+ "rstrip": false,
2184
+ "single_word": false,
2185
+ "special": true
2186
+ },
2187
+ "200194": {
2188
+ "content": "ipc_t",
2189
+ "lstrip": false,
2190
+ "normalized": false,
2191
+ "rstrip": false,
2192
+ "single_word": false,
2193
+ "special": true
2194
+ },
2195
+ "200195": {
2196
+ "content": "sbPLA",
2197
+ "lstrip": false,
2198
+ "normalized": false,
2199
+ "rstrip": false,
2200
+ "single_word": false,
2201
+ "special": true
2202
+ },
2203
+ "200196": {
2204
+ "content": "xBTV",
2205
+ "lstrip": false,
2206
+ "normalized": false,
2207
+ "rstrip": false,
2208
+ "single_word": false,
2209
+ "special": true
2210
+ },
2211
+ "200197": {
2212
+ "content": "xps",
2213
+ "lstrip": false,
2214
+ "normalized": false,
2215
+ "rstrip": false,
2216
+ "single_word": false,
2217
+ "special": true
2218
+ }
2219
+ },
2220
+ "additional_special_tokens": [
2221
+ "AAD",
2222
+ "AArch64",
2223
+ "ACL",
2224
+ "AD",
2225
+ "AES",
2226
+ "AES256GCM",
2227
+ "AESCBC",
2228
+ "AKE",
2229
+ "AON",
2230
+ "ASID",
2231
+ "AXI",
2232
+ "Acronym",
2233
+ "AoU",
2234
+ "AutoSar",
2235
+ "BAM",
2236
+ "BCH",
2237
+ "BIST",
2238
+ "BOM",
2239
+ "BPMP",
2240
+ "BPS",
2241
+ "BPU",
2242
+ "BRBCT",
2243
+ "BW",
2244
+ "C2C",
2245
+ "CA",
2246
+ "CAN",
2247
+ "CANFD",
2248
+ "CAR",
2249
+ "CAVP",
2250
+ "CBB",
2251
+ "CBC",
2252
+ "CBR",
2253
+ "CCM",
2254
+ "CCPLEX",
2255
+ "CCPLEX_L2",
2256
+ "CCPLEX_MISC",
2257
+ "CCPLEX_SCF",
2258
+ "CDD",
2259
+ "CIF",
2260
+ "CMAC",
2261
+ "CPE",
2262
+ "CPU",
2263
+ "CRC",
2264
+ "CSI",
2265
+ "CSP",
2266
+ "CTR",
2267
+ "CTXT",
2268
+ "CV",
2269
+ "DBB",
2270
+ "DEP",
2271
+ "DEV",
2272
+ "DFA",
2273
+ "DFT",
2274
+ "DIP",
2275
+ "DISPLAY",
2276
+ "DLA",
2277
+ "DMA",
2278
+ "DMEM",
2279
+ "DPA",
2280
+ "DSC",
2281
+ "DT",
2282
+ "DU",
2283
+ "DVMU",
2284
+ "EC",
2285
+ "ECB",
2286
+ "ECC",
2287
+ "ECDHE",
2288
+ "ECDSA",
2289
+ "ECID",
2290
+ "EDR",
2291
+ "EOF",
2292
+ "EOTTI",
2293
+ "EQoS",
2294
+ "FCL",
2295
+ "FHTI",
2296
+ "FIPS",
2297
+ "FMEA",
2298
+ "FMON",
2299
+ "FO",
2300
+ "FP",
2301
+ "FPS",
2302
+ "FW",
2303
+ "FuSa",
2304
+ "GCM",
2305
+ "GFD",
2306
+ "GIC",
2307
+ "GMAC",
2308
+ "GMSL",
2309
+ "GOP",
2310
+ "GP",
2311
+ "GPCDMA",
2312
+ "GPU",
2313
+ "GR",
2314
+ "Gpps",
2315
+ "HBR",
2316
+ "HBR2",
2317
+ "HBR3",
2318
+ "HDS",
2319
+ "HIS",
2320
+ "HMAC",
2321
+ "HPSE",
2322
+ "HSI",
2323
+ "HSM",
2324
+ "HSP",
2325
+ "HW",
2326
+ "IAS",
2327
+ "IC",
2328
+ "ICD",
2329
+ "IDR",
2330
+ "IDT",
2331
+ "IEP",
2332
+ "IEU",
2333
+ "IFU",
2334
+ "IID",
2335
+ "ILD",
2336
+ "IMEM",
2337
+ "IOC",
2338
+ "IOFA",
2339
+ "IOMMU",
2340
+ "IPC",
2341
+ "IPI",
2342
+ "IRF",
2343
+ "IST",
2344
+ "IV",
2345
+ "IoT",
2346
+ "JSR",
2347
+ "KAT",
2348
+ "KCV",
2349
+ "KDF",
2350
+ "KPI",
2351
+ "L1PT",
2352
+ "L2C",
2353
+ "L2mDIR",
2354
+ "L2vDIR",
2355
+ "LAB",
2356
+ "LBIST",
2357
+ "LDC",
2358
+ "LFT",
2359
+ "LIC",
2360
+ "LIP",
2361
+ "LSB",
2362
+ "MAC",
2363
+ "MAQ",
2364
+ "MB",
2365
+ "MBIST",
2366
+ "MCAL",
2367
+ "MCE",
2368
+ "MCU",
2369
+ "MSB",
2370
+ "MSS",
2371
+ "MST",
2372
+ "MTS",
2373
+ "MiTM",
2374
+ "NIP",
2375
+ "NIST",
2376
+ "NITO",
2377
+ "NOC",
2378
+ "NOOP",
2379
+ "NT",
2380
+ "NVDEC",
2381
+ "NVENC",
2382
+ "NVJPG",
2383
+ "NVM",
2384
+ "NVVSE",
2385
+ "OEM",
2386
+ "OFA",
2387
+ "OS",
2388
+ "OSP",
2389
+ "OTP",
2390
+ "PB",
2391
+ "PCIE",
2392
+ "PCPU",
2393
+ "PCR",
2394
+ "PCT",
2395
+ "PDK",
2396
+ "PII",
2397
+ "PIP",
2398
+ "PKC",
2399
+ "PKCS",
2400
+ "PKI",
2401
+ "PL",
2402
+ "PLA",
2403
+ "POR",
2404
+ "PPC",
2405
+ "PSC",
2406
+ "PTXT",
2407
+ "PVA",
2408
+ "QNX",
2409
+ "QOS",
2410
+ "QSPI",
2411
+ "RBG",
2412
+ "RBR",
2413
+ "RC",
2414
+ "RDEV",
2415
+ "REE",
2416
+ "RMA",
2417
+ "RMW",
2418
+ "RSA",
2419
+ "RSB",
2420
+ "RTS",
2421
+ "RoT",
2422
+ "SAE",
2423
+ "SBK",
2424
+ "SCH",
2425
+ "SDK",
2426
+ "SE",
2427
+ "SEL0",
2428
+ "SEL1",
2429
+ "SEooC",
2430
+ "SGM",
2431
+ "SHA",
2432
+ "SHA256",
2433
+ "SHA512",
2434
+ "SHE",
2435
+ "SKU",
2436
+ "SNOC",
2437
+ "SO",
2438
+ "SPA",
2439
+ "SQ",
2440
+ "SSR",
2441
+ "SST",
2442
+ "SW",
2443
+ "SWAT",
2444
+ "SoC",
2445
+ "TA",
2446
+ "TCF",
2447
+ "TEE",
2448
+ "THI",
2449
+ "TNR",
2450
+ "TOS",
2451
+ "TRC",
2452
+ "TRL",
2453
+ "TSEC",
2454
+ "TZ",
2455
+ "UFS",
2456
+ "VBR",
2457
+ "VCPU",
2458
+ "VI",
2459
+ "VIC",
2460
+ "VMEM",
2461
+ "VMID",
2462
+ "VPU",
2463
+ "VRC",
2464
+ "VUI",
2465
+ "WARB",
2466
+ "XIP",
2467
+ "bpp",
2468
+ "eMMC",
2469
+ "hfPLA",
2470
+ "iGPU",
2471
+ "ipc",
2472
+ "ipc_fg",
2473
+ "ipc_t",
2474
+ "sbPLA",
2475
+ "xBTV",
2476
+ "xps"
2477
+ ],
2478
+ "bos_token": "<|startoftext|>",
2479
+ "clean_up_tokenization_spaces": false,
2480
+ "eos_token": "<|return|>",
2481
+ "extra_special_tokens": {},
2482
+ "model_input_names": [
2483
+ "input_ids",
2484
+ "attention_mask"
2485
+ ],
2486
+ "model_max_length": 1000000000000000019884624838656,
2487
+ "pad_token": "<|endoftext|>",
2488
+ "tokenizer_class": "PreTrainedTokenizerFast"
2489
+ }
checkpoint-1642/trainer_state.json ADDED
@@ -0,0 +1,1510 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 1642,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.0060901339829476245,
14
+ "grad_norm": 23.5319766998291,
15
+ "learning_rate": 1.2162162162162164e-05,
16
+ "loss": 4.5905,
17
+ "mean_token_accuracy": 0.3401473943144083,
18
+ "num_tokens": 132681.0,
19
+ "step": 10
20
+ },
21
+ {
22
+ "epoch": 0.012180267965895249,
23
+ "grad_norm": 6.916630744934082,
24
+ "learning_rate": 2.5675675675675675e-05,
25
+ "loss": 3.957,
26
+ "mean_token_accuracy": 0.3799716055393219,
27
+ "num_tokens": 264238.0,
28
+ "step": 20
29
+ },
30
+ {
31
+ "epoch": 0.018270401948842874,
32
+ "grad_norm": 2.717982292175293,
33
+ "learning_rate": 3.918918918918919e-05,
34
+ "loss": 3.047,
35
+ "mean_token_accuracy": 0.46811963245272636,
36
+ "num_tokens": 401308.0,
37
+ "step": 30
38
+ },
39
+ {
40
+ "epoch": 0.024360535931790498,
41
+ "grad_norm": 2.407865524291992,
42
+ "learning_rate": 5.27027027027027e-05,
43
+ "loss": 2.5322,
44
+ "mean_token_accuracy": 0.5190828196704388,
45
+ "num_tokens": 532444.0,
46
+ "step": 40
47
+ },
48
+ {
49
+ "epoch": 0.030450669914738125,
50
+ "grad_norm": 1.018301248550415,
51
+ "learning_rate": 6.621621621621621e-05,
52
+ "loss": 2.1325,
53
+ "mean_token_accuracy": 0.5782605841755867,
54
+ "num_tokens": 660406.0,
55
+ "step": 50
56
+ },
57
+ {
58
+ "epoch": 0.03654080389768575,
59
+ "grad_norm": 0.7315741181373596,
60
+ "learning_rate": 7.972972972972974e-05,
61
+ "loss": 1.9044,
62
+ "mean_token_accuracy": 0.6264914631843567,
63
+ "num_tokens": 795304.0,
64
+ "step": 60
65
+ },
66
+ {
67
+ "epoch": 0.04263093788063337,
68
+ "grad_norm": 0.6652920246124268,
69
+ "learning_rate": 9.324324324324324e-05,
70
+ "loss": 1.633,
71
+ "mean_token_accuracy": 0.6683938711881637,
72
+ "num_tokens": 934543.0,
73
+ "step": 70
74
+ },
75
+ {
76
+ "epoch": 0.048721071863580996,
77
+ "grad_norm": 0.6119660139083862,
78
+ "learning_rate": 0.00010675675675675677,
79
+ "loss": 1.543,
80
+ "mean_token_accuracy": 0.6834091022610664,
81
+ "num_tokens": 1070669.0,
82
+ "step": 80
83
+ },
84
+ {
85
+ "epoch": 0.05481120584652863,
86
+ "grad_norm": 0.591424286365509,
87
+ "learning_rate": 0.00012027027027027027,
88
+ "loss": 1.4154,
89
+ "mean_token_accuracy": 0.6991497233510018,
90
+ "num_tokens": 1211114.0,
91
+ "step": 90
92
+ },
93
+ {
94
+ "epoch": 0.06090133982947625,
95
+ "grad_norm": 0.5663530230522156,
96
+ "learning_rate": 0.0001337837837837838,
97
+ "loss": 1.3176,
98
+ "mean_token_accuracy": 0.7089206710457802,
99
+ "num_tokens": 1349584.0,
100
+ "step": 100
101
+ },
102
+ {
103
+ "epoch": 0.06699147381242387,
104
+ "grad_norm": 0.5881878137588501,
105
+ "learning_rate": 0.0001472972972972973,
106
+ "loss": 1.2293,
107
+ "mean_token_accuracy": 0.7254403859376908,
108
+ "num_tokens": 1487515.0,
109
+ "step": 110
110
+ },
111
+ {
112
+ "epoch": 0.0730816077953715,
113
+ "grad_norm": 0.7664394974708557,
114
+ "learning_rate": 0.00016081081081081083,
115
+ "loss": 1.1814,
116
+ "mean_token_accuracy": 0.7306812778115273,
117
+ "num_tokens": 1618603.0,
118
+ "step": 120
119
+ },
120
+ {
121
+ "epoch": 0.07917174177831912,
122
+ "grad_norm": 0.6155670881271362,
123
+ "learning_rate": 0.00017432432432432432,
124
+ "loss": 1.1967,
125
+ "mean_token_accuracy": 0.7284250959753991,
126
+ "num_tokens": 1750466.0,
127
+ "step": 130
128
+ },
129
+ {
130
+ "epoch": 0.08526187576126674,
131
+ "grad_norm": 0.5296258330345154,
132
+ "learning_rate": 0.00018783783783783784,
133
+ "loss": 1.0955,
134
+ "mean_token_accuracy": 0.7472824215888977,
135
+ "num_tokens": 1887913.0,
136
+ "step": 140
137
+ },
138
+ {
139
+ "epoch": 0.09135200974421437,
140
+ "grad_norm": 0.5564976334571838,
141
+ "learning_rate": 0.00019999998054550544,
142
+ "loss": 1.118,
143
+ "mean_token_accuracy": 0.7397311359643937,
144
+ "num_tokens": 2018579.0,
145
+ "step": 150
146
+ },
147
+ {
148
+ "epoch": 0.09744214372716199,
149
+ "grad_norm": 0.5301142930984497,
150
+ "learning_rate": 0.00019999764601633156,
151
+ "loss": 1.045,
152
+ "mean_token_accuracy": 0.7519380420446395,
153
+ "num_tokens": 2158851.0,
154
+ "step": 160
155
+ },
156
+ {
157
+ "epoch": 0.10353227771010962,
158
+ "grad_norm": 0.5949111580848694,
159
+ "learning_rate": 0.00019999142070388495,
160
+ "loss": 1.0497,
161
+ "mean_token_accuracy": 0.7520910769701004,
162
+ "num_tokens": 2296715.0,
163
+ "step": 170
164
+ },
165
+ {
166
+ "epoch": 0.10962241169305725,
167
+ "grad_norm": 0.6169262528419495,
168
+ "learning_rate": 0.0001999813048772986,
169
+ "loss": 1.0821,
170
+ "mean_token_accuracy": 0.7406247839331627,
171
+ "num_tokens": 2424756.0,
172
+ "step": 180
173
+ },
174
+ {
175
+ "epoch": 0.11571254567600488,
176
+ "grad_norm": 0.58912593126297,
177
+ "learning_rate": 0.00019996729897390057,
178
+ "loss": 1.0286,
179
+ "mean_token_accuracy": 0.7527454376220704,
180
+ "num_tokens": 2559362.0,
181
+ "step": 190
182
+ },
183
+ {
184
+ "epoch": 0.1218026796589525,
185
+ "grad_norm": 0.5084304213523865,
186
+ "learning_rate": 0.00019994940359919483,
187
+ "loss": 0.992,
188
+ "mean_token_accuracy": 0.7640391126275062,
189
+ "num_tokens": 2700231.0,
190
+ "step": 200
191
+ },
192
+ {
193
+ "epoch": 0.1278928136419001,
194
+ "grad_norm": 0.5790796279907227,
195
+ "learning_rate": 0.00019992761952683516,
196
+ "loss": 1.0146,
197
+ "mean_token_accuracy": 0.7554366230964661,
198
+ "num_tokens": 2831324.0,
199
+ "step": 210
200
+ },
201
+ {
202
+ "epoch": 0.13398294762484775,
203
+ "grad_norm": 0.5852051377296448,
204
+ "learning_rate": 0.00019990194769859188,
205
+ "loss": 0.978,
206
+ "mean_token_accuracy": 0.7612502485513687,
207
+ "num_tokens": 2967346.0,
208
+ "step": 220
209
+ },
210
+ {
211
+ "epoch": 0.14007308160779536,
212
+ "grad_norm": 0.5102785229682922,
213
+ "learning_rate": 0.00019987238922431088,
214
+ "loss": 0.9616,
215
+ "mean_token_accuracy": 0.7677591517567635,
216
+ "num_tokens": 3110936.0,
217
+ "step": 230
218
+ },
219
+ {
220
+ "epoch": 0.146163215590743,
221
+ "grad_norm": 0.5472669005393982,
222
+ "learning_rate": 0.00019983894538186576,
223
+ "loss": 0.9535,
224
+ "mean_token_accuracy": 0.76737689524889,
225
+ "num_tokens": 3247496.0,
226
+ "step": 240
227
+ },
228
+ {
229
+ "epoch": 0.15225334957369063,
230
+ "grad_norm": 0.5611053109169006,
231
+ "learning_rate": 0.0001998016176171026,
232
+ "loss": 0.9577,
233
+ "mean_token_accuracy": 0.7626092001795769,
234
+ "num_tokens": 3384178.0,
235
+ "step": 250
236
+ },
237
+ {
238
+ "epoch": 0.15834348355663824,
239
+ "grad_norm": 0.54055255651474,
240
+ "learning_rate": 0.0001997604075437774,
241
+ "loss": 0.9907,
242
+ "mean_token_accuracy": 0.7575223430991173,
243
+ "num_tokens": 3517617.0,
244
+ "step": 260
245
+ },
246
+ {
247
+ "epoch": 0.16443361753958588,
248
+ "grad_norm": 0.558316707611084,
249
+ "learning_rate": 0.0001997153169434864,
250
+ "loss": 0.944,
251
+ "mean_token_accuracy": 0.7664194419980049,
252
+ "num_tokens": 3662878.0,
253
+ "step": 270
254
+ },
255
+ {
256
+ "epoch": 0.1705237515225335,
257
+ "grad_norm": 0.49766939878463745,
258
+ "learning_rate": 0.0001996663477655889,
259
+ "loss": 0.9106,
260
+ "mean_token_accuracy": 0.7760038167238236,
261
+ "num_tokens": 3807411.0,
262
+ "step": 280
263
+ },
264
+ {
265
+ "epoch": 0.17661388550548113,
266
+ "grad_norm": 0.4953667223453522,
267
+ "learning_rate": 0.0001996135021271232,
268
+ "loss": 0.9687,
269
+ "mean_token_accuracy": 0.7605679705739021,
270
+ "num_tokens": 3936840.0,
271
+ "step": 290
272
+ },
273
+ {
274
+ "epoch": 0.18270401948842874,
275
+ "grad_norm": 0.5447947978973389,
276
+ "learning_rate": 0.00019955678231271484,
277
+ "loss": 0.9625,
278
+ "mean_token_accuracy": 0.7603292793035508,
279
+ "num_tokens": 4067826.0,
280
+ "step": 300
281
+ },
282
+ {
283
+ "epoch": 0.18879415347137637,
284
+ "grad_norm": 0.4665842056274414,
285
+ "learning_rate": 0.00019949619077447807,
286
+ "loss": 0.9372,
287
+ "mean_token_accuracy": 0.7676101759076118,
288
+ "num_tokens": 4205887.0,
289
+ "step": 310
290
+ },
291
+ {
292
+ "epoch": 0.19488428745432398,
293
+ "grad_norm": 0.515690267086029,
294
+ "learning_rate": 0.00019943173013190965,
295
+ "loss": 0.923,
296
+ "mean_token_accuracy": 0.7708473294973374,
297
+ "num_tokens": 4342894.0,
298
+ "step": 320
299
+ },
300
+ {
301
+ "epoch": 0.20097442143727162,
302
+ "grad_norm": 0.5831382274627686,
303
+ "learning_rate": 0.00019936340317177565,
304
+ "loss": 0.9203,
305
+ "mean_token_accuracy": 0.7708552837371826,
306
+ "num_tokens": 4477651.0,
307
+ "step": 330
308
+ },
309
+ {
310
+ "epoch": 0.20706455542021923,
311
+ "grad_norm": 0.6162773966789246,
312
+ "learning_rate": 0.0001992912128479911,
313
+ "loss": 0.916,
314
+ "mean_token_accuracy": 0.7702088996767997,
315
+ "num_tokens": 4610746.0,
316
+ "step": 340
317
+ },
318
+ {
319
+ "epoch": 0.21315468940316687,
320
+ "grad_norm": 0.5172462463378906,
321
+ "learning_rate": 0.00019921516228149207,
322
+ "loss": 0.8942,
323
+ "mean_token_accuracy": 0.7741821393370628,
324
+ "num_tokens": 4751175.0,
325
+ "step": 350
326
+ },
327
+ {
328
+ "epoch": 0.2192448233861145,
329
+ "grad_norm": 0.5890468955039978,
330
+ "learning_rate": 0.0001991352547601009,
331
+ "loss": 0.9229,
332
+ "mean_token_accuracy": 0.7691043332219124,
333
+ "num_tokens": 4882328.0,
334
+ "step": 360
335
+ },
336
+ {
337
+ "epoch": 0.22533495736906212,
338
+ "grad_norm": 0.5522404909133911,
339
+ "learning_rate": 0.00019905149373838408,
340
+ "loss": 0.9294,
341
+ "mean_token_accuracy": 0.7646071568131447,
342
+ "num_tokens": 5012181.0,
343
+ "step": 370
344
+ },
345
+ {
346
+ "epoch": 0.23142509135200975,
347
+ "grad_norm": 0.5349445939064026,
348
+ "learning_rate": 0.0001989638828375028,
349
+ "loss": 0.8797,
350
+ "mean_token_accuracy": 0.7771721839904785,
351
+ "num_tokens": 5151133.0,
352
+ "step": 380
353
+ },
354
+ {
355
+ "epoch": 0.23751522533495736,
356
+ "grad_norm": 0.531052827835083,
357
+ "learning_rate": 0.00019887242584505635,
358
+ "loss": 0.9221,
359
+ "mean_token_accuracy": 0.7678465083241462,
360
+ "num_tokens": 5279790.0,
361
+ "step": 390
362
+ },
363
+ {
364
+ "epoch": 0.243605359317905,
365
+ "grad_norm": 0.5126324892044067,
366
+ "learning_rate": 0.00019877712671491864,
367
+ "loss": 0.8862,
368
+ "mean_token_accuracy": 0.7739894777536392,
369
+ "num_tokens": 5412390.0,
370
+ "step": 400
371
+ },
372
+ {
373
+ "epoch": 0.2496954933008526,
374
+ "grad_norm": 0.5111438632011414,
375
+ "learning_rate": 0.00019867798956706693,
376
+ "loss": 0.9005,
377
+ "mean_token_accuracy": 0.7721902653574944,
378
+ "num_tokens": 5545801.0,
379
+ "step": 410
380
+ },
381
+ {
382
+ "epoch": 0.2557856272838002,
383
+ "grad_norm": 0.5488138794898987,
384
+ "learning_rate": 0.00019857501868740402,
385
+ "loss": 0.8988,
386
+ "mean_token_accuracy": 0.7690282896161079,
387
+ "num_tokens": 5673758.0,
388
+ "step": 420
389
+ },
390
+ {
391
+ "epoch": 0.2618757612667479,
392
+ "grad_norm": 0.5497994422912598,
393
+ "learning_rate": 0.0001984682185275727,
394
+ "loss": 0.8802,
395
+ "mean_token_accuracy": 0.7780183687806129,
396
+ "num_tokens": 5813158.0,
397
+ "step": 430
398
+ },
399
+ {
400
+ "epoch": 0.2679658952496955,
401
+ "grad_norm": 0.5478431582450867,
402
+ "learning_rate": 0.0001983575937047635,
403
+ "loss": 0.865,
404
+ "mean_token_accuracy": 0.7785944610834121,
405
+ "num_tokens": 5947367.0,
406
+ "step": 440
407
+ },
408
+ {
409
+ "epoch": 0.2740560292326431,
410
+ "grad_norm": 0.5188766717910767,
411
+ "learning_rate": 0.00019824314900151487,
412
+ "loss": 0.8798,
413
+ "mean_token_accuracy": 0.7752803862094879,
414
+ "num_tokens": 6081060.0,
415
+ "step": 450
416
+ },
417
+ {
418
+ "epoch": 0.2801461632155907,
419
+ "grad_norm": 0.530222475528717,
420
+ "learning_rate": 0.00019812488936550666,
421
+ "loss": 0.8628,
422
+ "mean_token_accuracy": 0.7801630645990372,
423
+ "num_tokens": 6217834.0,
424
+ "step": 460
425
+ },
426
+ {
427
+ "epoch": 0.2862362971985384,
428
+ "grad_norm": 0.5987964868545532,
429
+ "learning_rate": 0.00019800281990934614,
430
+ "loss": 0.8775,
431
+ "mean_token_accuracy": 0.7760324433445931,
432
+ "num_tokens": 6350451.0,
433
+ "step": 470
434
+ },
435
+ {
436
+ "epoch": 0.292326431181486,
437
+ "grad_norm": 0.5468559265136719,
438
+ "learning_rate": 0.0001978769459103468,
439
+ "loss": 0.8721,
440
+ "mean_token_accuracy": 0.7794204503297806,
441
+ "num_tokens": 6484738.0,
442
+ "step": 480
443
+ },
444
+ {
445
+ "epoch": 0.2984165651644336,
446
+ "grad_norm": 0.5541098117828369,
447
+ "learning_rate": 0.0001977472728103005,
448
+ "loss": 0.8785,
449
+ "mean_token_accuracy": 0.7767582029104233,
450
+ "num_tokens": 6619313.0,
451
+ "step": 490
452
+ },
453
+ {
454
+ "epoch": 0.30450669914738127,
455
+ "grad_norm": 0.5134281516075134,
456
+ "learning_rate": 0.0001976138062152419,
457
+ "loss": 0.8717,
458
+ "mean_token_accuracy": 0.7752724394202233,
459
+ "num_tokens": 6753195.0,
460
+ "step": 500
461
+ },
462
+ {
463
+ "epoch": 0.3105968331303289,
464
+ "grad_norm": 0.49164435267448425,
465
+ "learning_rate": 0.00019747655189520633,
466
+ "loss": 0.8757,
467
+ "mean_token_accuracy": 0.7768464118242264,
468
+ "num_tokens": 6890448.0,
469
+ "step": 510
470
+ },
471
+ {
472
+ "epoch": 0.3166869671132765,
473
+ "grad_norm": 0.5899345278739929,
474
+ "learning_rate": 0.00019733551578398023,
475
+ "loss": 0.8322,
476
+ "mean_token_accuracy": 0.7859320402145386,
477
+ "num_tokens": 7027488.0,
478
+ "step": 520
479
+ },
480
+ {
481
+ "epoch": 0.3227771010962241,
482
+ "grad_norm": 0.6552841663360596,
483
+ "learning_rate": 0.0001971907039788447,
484
+ "loss": 0.861,
485
+ "mean_token_accuracy": 0.7770532324910164,
486
+ "num_tokens": 7161184.0,
487
+ "step": 530
488
+ },
489
+ {
490
+ "epoch": 0.32886723507917176,
491
+ "grad_norm": 0.5038822889328003,
492
+ "learning_rate": 0.0001970421227403117,
493
+ "loss": 0.8825,
494
+ "mean_token_accuracy": 0.775890800356865,
495
+ "num_tokens": 7294399.0,
496
+ "step": 540
497
+ },
498
+ {
499
+ "epoch": 0.33495736906211937,
500
+ "grad_norm": 0.5094267129898071,
501
+ "learning_rate": 0.00019688977849185378,
502
+ "loss": 0.8598,
503
+ "mean_token_accuracy": 0.7817838475108146,
504
+ "num_tokens": 7427183.0,
505
+ "step": 550
506
+ },
507
+ {
508
+ "epoch": 0.341047503045067,
509
+ "grad_norm": 0.5282809138298035,
510
+ "learning_rate": 0.00019673367781962594,
511
+ "loss": 0.8463,
512
+ "mean_token_accuracy": 0.7812959104776382,
513
+ "num_tokens": 7561734.0,
514
+ "step": 560
515
+ },
516
+ {
517
+ "epoch": 0.3471376370280146,
518
+ "grad_norm": 0.45355409383773804,
519
+ "learning_rate": 0.00019657382747218123,
520
+ "loss": 0.8207,
521
+ "mean_token_accuracy": 0.7888262197375298,
522
+ "num_tokens": 7706228.0,
523
+ "step": 570
524
+ },
525
+ {
526
+ "epoch": 0.35322777101096225,
527
+ "grad_norm": 0.5162333846092224,
528
+ "learning_rate": 0.00019641023436017883,
529
+ "loss": 0.8235,
530
+ "mean_token_accuracy": 0.7868947923183441,
531
+ "num_tokens": 7846684.0,
532
+ "step": 580
533
+ },
534
+ {
535
+ "epoch": 0.35931790499390986,
536
+ "grad_norm": 0.5194632411003113,
537
+ "learning_rate": 0.00019624290555608526,
538
+ "loss": 0.8129,
539
+ "mean_token_accuracy": 0.7884069249033928,
540
+ "num_tokens": 7986811.0,
541
+ "step": 590
542
+ },
543
+ {
544
+ "epoch": 0.3654080389768575,
545
+ "grad_norm": 0.5494846701622009,
546
+ "learning_rate": 0.00019607184829386882,
547
+ "loss": 0.8084,
548
+ "mean_token_accuracy": 0.7874000474810601,
549
+ "num_tokens": 8124538.0,
550
+ "step": 600
551
+ },
552
+ {
553
+ "epoch": 0.37149817295980514,
554
+ "grad_norm": 0.5368776917457581,
555
+ "learning_rate": 0.0001958970699686866,
556
+ "loss": 0.8225,
557
+ "mean_token_accuracy": 0.783010233938694,
558
+ "num_tokens": 8260529.0,
559
+ "step": 610
560
+ },
561
+ {
562
+ "epoch": 0.37758830694275275,
563
+ "grad_norm": 0.6229024529457092,
564
+ "learning_rate": 0.00019571857813656496,
565
+ "loss": 0.8786,
566
+ "mean_token_accuracy": 0.7753148928284646,
567
+ "num_tokens": 8389042.0,
568
+ "step": 620
569
+ },
570
+ {
571
+ "epoch": 0.38367844092570036,
572
+ "grad_norm": 0.5601000785827637,
573
+ "learning_rate": 0.00019553638051407279,
574
+ "loss": 0.8909,
575
+ "mean_token_accuracy": 0.7745720192790031,
576
+ "num_tokens": 8513603.0,
577
+ "step": 630
578
+ },
579
+ {
580
+ "epoch": 0.38976857490864797,
581
+ "grad_norm": 0.438970685005188,
582
+ "learning_rate": 0.0001953504849779879,
583
+ "loss": 0.8085,
584
+ "mean_token_accuracy": 0.7871840804815292,
585
+ "num_tokens": 8652970.0,
586
+ "step": 640
587
+ },
588
+ {
589
+ "epoch": 0.39585870889159563,
590
+ "grad_norm": 0.5505132079124451,
591
+ "learning_rate": 0.00019516089956495648,
592
+ "loss": 0.8102,
593
+ "mean_token_accuracy": 0.7869585514068603,
594
+ "num_tokens": 8792103.0,
595
+ "step": 650
596
+ },
597
+ {
598
+ "epoch": 0.40194884287454324,
599
+ "grad_norm": 0.5447221398353577,
600
+ "learning_rate": 0.00019496763247114581,
601
+ "loss": 0.8336,
602
+ "mean_token_accuracy": 0.7816034242510795,
603
+ "num_tokens": 8926853.0,
604
+ "step": 660
605
+ },
606
+ {
607
+ "epoch": 0.40803897685749085,
608
+ "grad_norm": 0.4652746915817261,
609
+ "learning_rate": 0.00019477069205188965,
610
+ "loss": 0.8383,
611
+ "mean_token_accuracy": 0.7826304718852043,
612
+ "num_tokens": 9059592.0,
613
+ "step": 670
614
+ },
615
+ {
616
+ "epoch": 0.41412911084043846,
617
+ "grad_norm": 0.42363590002059937,
618
+ "learning_rate": 0.00019457008682132726,
619
+ "loss": 0.847,
620
+ "mean_token_accuracy": 0.7810002073645592,
621
+ "num_tokens": 9193062.0,
622
+ "step": 680
623
+ },
624
+ {
625
+ "epoch": 0.42021924482338613,
626
+ "grad_norm": 0.5209478735923767,
627
+ "learning_rate": 0.00019436582545203518,
628
+ "loss": 0.8766,
629
+ "mean_token_accuracy": 0.7733785718679428,
630
+ "num_tokens": 9315805.0,
631
+ "step": 690
632
+ },
633
+ {
634
+ "epoch": 0.42630937880633374,
635
+ "grad_norm": 0.5176642537117004,
636
+ "learning_rate": 0.00019415791677465237,
637
+ "loss": 0.8155,
638
+ "mean_token_accuracy": 0.7869213685393334,
639
+ "num_tokens": 9448863.0,
640
+ "step": 700
641
+ },
642
+ {
643
+ "epoch": 0.43239951278928135,
644
+ "grad_norm": 0.4531058371067047,
645
+ "learning_rate": 0.00019394636977749843,
646
+ "loss": 0.8096,
647
+ "mean_token_accuracy": 0.7903949975967407,
648
+ "num_tokens": 9589382.0,
649
+ "step": 710
650
+ },
651
+ {
652
+ "epoch": 0.438489646772229,
653
+ "grad_norm": 0.5651549100875854,
654
+ "learning_rate": 0.000193731193606185,
655
+ "loss": 0.8263,
656
+ "mean_token_accuracy": 0.7823062822222709,
657
+ "num_tokens": 9723562.0,
658
+ "step": 720
659
+ },
660
+ {
661
+ "epoch": 0.4445797807551766,
662
+ "grad_norm": 0.5377989411354065,
663
+ "learning_rate": 0.00019351239756322031,
664
+ "loss": 0.7993,
665
+ "mean_token_accuracy": 0.7908329650759697,
666
+ "num_tokens": 9859255.0,
667
+ "step": 730
668
+ },
669
+ {
670
+ "epoch": 0.45066991473812423,
671
+ "grad_norm": 0.5420868396759033,
672
+ "learning_rate": 0.00019328999110760722,
673
+ "loss": 0.8461,
674
+ "mean_token_accuracy": 0.7780480548739434,
675
+ "num_tokens": 9981578.0,
676
+ "step": 740
677
+ },
678
+ {
679
+ "epoch": 0.45676004872107184,
680
+ "grad_norm": 0.4889216125011444,
681
+ "learning_rate": 0.000193063983854434,
682
+ "loss": 0.7652,
683
+ "mean_token_accuracy": 0.7959530428051949,
684
+ "num_tokens": 10122922.0,
685
+ "step": 750
686
+ },
687
+ {
688
+ "epoch": 0.4628501827040195,
689
+ "grad_norm": 0.5044087767601013,
690
+ "learning_rate": 0.00019283438557445893,
691
+ "loss": 0.824,
692
+ "mean_token_accuracy": 0.7845935523509979,
693
+ "num_tokens": 10252854.0,
694
+ "step": 760
695
+ },
696
+ {
697
+ "epoch": 0.4689403166869671,
698
+ "grad_norm": 0.5286466479301453,
699
+ "learning_rate": 0.00019260120619368773,
700
+ "loss": 0.815,
701
+ "mean_token_accuracy": 0.7850656941533088,
702
+ "num_tokens": 10385075.0,
703
+ "step": 770
704
+ },
705
+ {
706
+ "epoch": 0.47503045066991473,
707
+ "grad_norm": 0.5441628694534302,
708
+ "learning_rate": 0.00019236445579294437,
709
+ "loss": 0.8048,
710
+ "mean_token_accuracy": 0.7876680314540863,
711
+ "num_tokens": 10520011.0,
712
+ "step": 780
713
+ },
714
+ {
715
+ "epoch": 0.48112058465286234,
716
+ "grad_norm": 0.49002447724342346,
717
+ "learning_rate": 0.0001921241446074355,
718
+ "loss": 0.8059,
719
+ "mean_token_accuracy": 0.7898563235998154,
720
+ "num_tokens": 10652488.0,
721
+ "step": 790
722
+ },
723
+ {
724
+ "epoch": 0.48721071863581,
725
+ "grad_norm": 0.4479144811630249,
726
+ "learning_rate": 0.0001918802830263077,
727
+ "loss": 0.7913,
728
+ "mean_token_accuracy": 0.7928732186555862,
729
+ "num_tokens": 10785974.0,
730
+ "step": 800
731
+ },
732
+ {
733
+ "epoch": 0.4933008526187576,
734
+ "grad_norm": 0.5007497668266296,
735
+ "learning_rate": 0.00019163288159219853,
736
+ "loss": 0.8083,
737
+ "mean_token_accuracy": 0.7893043681979179,
738
+ "num_tokens": 10920950.0,
739
+ "step": 810
740
+ },
741
+ {
742
+ "epoch": 0.4993909866017052,
743
+ "grad_norm": 0.5289483070373535,
744
+ "learning_rate": 0.00019138195100078064,
745
+ "loss": 0.8033,
746
+ "mean_token_accuracy": 0.7864485770463944,
747
+ "num_tokens": 11056380.0,
748
+ "step": 820
749
+ },
750
+ {
751
+ "epoch": 0.5054811205846529,
752
+ "grad_norm": 0.5604159832000732,
753
+ "learning_rate": 0.0001911275021002994,
754
+ "loss": 0.7652,
755
+ "mean_token_accuracy": 0.7946401730179786,
756
+ "num_tokens": 11196074.0,
757
+ "step": 830
758
+ },
759
+ {
760
+ "epoch": 0.5115712545676004,
761
+ "grad_norm": 0.43645399808883667,
762
+ "learning_rate": 0.00019086954589110397,
763
+ "loss": 0.7724,
764
+ "mean_token_accuracy": 0.7990294560790062,
765
+ "num_tokens": 11337990.0,
766
+ "step": 840
767
+ },
768
+ {
769
+ "epoch": 0.5176613885505481,
770
+ "grad_norm": 0.43992146849632263,
771
+ "learning_rate": 0.0001906080935251716,
772
+ "loss": 0.7612,
773
+ "mean_token_accuracy": 0.7999786615371705,
774
+ "num_tokens": 11481565.0,
775
+ "step": 850
776
+ },
777
+ {
778
+ "epoch": 0.5237515225334958,
779
+ "grad_norm": 0.5595120191574097,
780
+ "learning_rate": 0.0001903431563056256,
781
+ "loss": 0.8266,
782
+ "mean_token_accuracy": 0.7859750911593437,
783
+ "num_tokens": 11611714.0,
784
+ "step": 860
785
+ },
786
+ {
787
+ "epoch": 0.5298416565164433,
788
+ "grad_norm": 0.5001987218856812,
789
+ "learning_rate": 0.0001900747456862467,
790
+ "loss": 0.8506,
791
+ "mean_token_accuracy": 0.779585388302803,
792
+ "num_tokens": 11736573.0,
793
+ "step": 870
794
+ },
795
+ {
796
+ "epoch": 0.535931790499391,
797
+ "grad_norm": 0.430147647857666,
798
+ "learning_rate": 0.00018980287327097784,
799
+ "loss": 0.7707,
800
+ "mean_token_accuracy": 0.795211361348629,
801
+ "num_tokens": 11876859.0,
802
+ "step": 880
803
+ },
804
+ {
805
+ "epoch": 0.5420219244823387,
806
+ "grad_norm": 0.5346289873123169,
807
+ "learning_rate": 0.00018952755081342245,
808
+ "loss": 0.8057,
809
+ "mean_token_accuracy": 0.7871127843856811,
810
+ "num_tokens": 12007654.0,
811
+ "step": 890
812
+ },
813
+ {
814
+ "epoch": 0.5481120584652862,
815
+ "grad_norm": 0.46072253584861755,
816
+ "learning_rate": 0.00018924879021633653,
817
+ "loss": 0.7924,
818
+ "mean_token_accuracy": 0.7913773030042648,
819
+ "num_tokens": 12140520.0,
820
+ "step": 900
821
+ },
822
+ {
823
+ "epoch": 0.5542021924482339,
824
+ "grad_norm": 0.4803653955459595,
825
+ "learning_rate": 0.00018896660353111375,
826
+ "loss": 0.8398,
827
+ "mean_token_accuracy": 0.7807079553604126,
828
+ "num_tokens": 12267219.0,
829
+ "step": 910
830
+ },
831
+ {
832
+ "epoch": 0.5602923264311814,
833
+ "grad_norm": 0.5219636559486389,
834
+ "learning_rate": 0.0001886810029572647,
835
+ "loss": 0.7612,
836
+ "mean_token_accuracy": 0.7993015512824059,
837
+ "num_tokens": 12404646.0,
838
+ "step": 920
839
+ },
840
+ {
841
+ "epoch": 0.5663824604141291,
842
+ "grad_norm": 0.501483142375946,
843
+ "learning_rate": 0.00018839200084188936,
844
+ "loss": 0.7953,
845
+ "mean_token_accuracy": 0.787814213335514,
846
+ "num_tokens": 12538219.0,
847
+ "step": 930
848
+ },
849
+ {
850
+ "epoch": 0.5724725943970768,
851
+ "grad_norm": 0.47334522008895874,
852
+ "learning_rate": 0.00018809960967914346,
853
+ "loss": 0.789,
854
+ "mean_token_accuracy": 0.7928574904799461,
855
+ "num_tokens": 12673805.0,
856
+ "step": 940
857
+ },
858
+ {
859
+ "epoch": 0.5785627283800243,
860
+ "grad_norm": 0.5057492852210999,
861
+ "learning_rate": 0.00018780384210969806,
862
+ "loss": 0.7746,
863
+ "mean_token_accuracy": 0.7947553545236588,
864
+ "num_tokens": 12811727.0,
865
+ "step": 950
866
+ },
867
+ {
868
+ "epoch": 0.584652862362972,
869
+ "grad_norm": 0.5179910659790039,
870
+ "learning_rate": 0.00018750471092019325,
871
+ "loss": 0.7962,
872
+ "mean_token_accuracy": 0.7905686929821968,
873
+ "num_tokens": 12947641.0,
874
+ "step": 960
875
+ },
876
+ {
877
+ "epoch": 0.5907429963459196,
878
+ "grad_norm": 0.45797088742256165,
879
+ "learning_rate": 0.00018720222904268543,
880
+ "loss": 0.7678,
881
+ "mean_token_accuracy": 0.7969774708151818,
882
+ "num_tokens": 13083869.0,
883
+ "step": 970
884
+ },
885
+ {
886
+ "epoch": 0.5968331303288672,
887
+ "grad_norm": 0.48360612988471985,
888
+ "learning_rate": 0.00018689640955408803,
889
+ "loss": 0.7996,
890
+ "mean_token_accuracy": 0.7885591968894005,
891
+ "num_tokens": 13211807.0,
892
+ "step": 980
893
+ },
894
+ {
895
+ "epoch": 0.6029232643118149,
896
+ "grad_norm": 0.4378497004508972,
897
+ "learning_rate": 0.00018658726567560635,
898
+ "loss": 0.7652,
899
+ "mean_token_accuracy": 0.7969291344285011,
900
+ "num_tokens": 13351856.0,
901
+ "step": 990
902
+ },
903
+ {
904
+ "epoch": 0.6090133982947625,
905
+ "grad_norm": 0.4857536852359772,
906
+ "learning_rate": 0.00018627481077216577,
907
+ "loss": 0.7786,
908
+ "mean_token_accuracy": 0.7914443418383599,
909
+ "num_tokens": 13486443.0,
910
+ "step": 1000
911
+ },
912
+ {
913
+ "epoch": 0.6151035322777101,
914
+ "grad_norm": 0.5233064293861389,
915
+ "learning_rate": 0.0001859590583518343,
916
+ "loss": 0.8241,
917
+ "mean_token_accuracy": 0.7811850637197495,
918
+ "num_tokens": 13612035.0,
919
+ "step": 1010
920
+ },
921
+ {
922
+ "epoch": 0.6211936662606578,
923
+ "grad_norm": 0.5328738689422607,
924
+ "learning_rate": 0.00018564002206523816,
925
+ "loss": 0.7502,
926
+ "mean_token_accuracy": 0.7993430674076081,
927
+ "num_tokens": 13756509.0,
928
+ "step": 1020
929
+ },
930
+ {
931
+ "epoch": 0.6272838002436053,
932
+ "grad_norm": 0.47962310910224915,
933
+ "learning_rate": 0.000185317715704972,
934
+ "loss": 0.7984,
935
+ "mean_token_accuracy": 0.7864531084895134,
936
+ "num_tokens": 13883033.0,
937
+ "step": 1030
938
+ },
939
+ {
940
+ "epoch": 0.633373934226553,
941
+ "grad_norm": 0.5685893893241882,
942
+ "learning_rate": 0.0001849921532050024,
943
+ "loss": 0.7869,
944
+ "mean_token_accuracy": 0.7909937381744385,
945
+ "num_tokens": 14015234.0,
946
+ "step": 1040
947
+ },
948
+ {
949
+ "epoch": 0.6394640682095006,
950
+ "grad_norm": 0.49146631360054016,
951
+ "learning_rate": 0.00018466334864006566,
952
+ "loss": 0.7952,
953
+ "mean_token_accuracy": 0.7878949210047722,
954
+ "num_tokens": 14149319.0,
955
+ "step": 1050
956
+ },
957
+ {
958
+ "epoch": 0.6455542021924482,
959
+ "grad_norm": 0.5556225776672363,
960
+ "learning_rate": 0.0001843313162250591,
961
+ "loss": 0.7524,
962
+ "mean_token_accuracy": 0.7994373366236687,
963
+ "num_tokens": 14286868.0,
964
+ "step": 1060
965
+ },
966
+ {
967
+ "epoch": 0.6516443361753959,
968
+ "grad_norm": 0.511379063129425,
969
+ "learning_rate": 0.00018399607031442666,
970
+ "loss": 0.7929,
971
+ "mean_token_accuracy": 0.7921562284231186,
972
+ "num_tokens": 14418354.0,
973
+ "step": 1070
974
+ },
975
+ {
976
+ "epoch": 0.6577344701583435,
977
+ "grad_norm": 0.5019840598106384,
978
+ "learning_rate": 0.00018365762540153836,
979
+ "loss": 0.758,
980
+ "mean_token_accuracy": 0.7989353060722351,
981
+ "num_tokens": 14553174.0,
982
+ "step": 1080
983
+ },
984
+ {
985
+ "epoch": 0.6638246041412911,
986
+ "grad_norm": 0.6032467484474182,
987
+ "learning_rate": 0.00018331599611806366,
988
+ "loss": 0.7888,
989
+ "mean_token_accuracy": 0.7903819754719734,
990
+ "num_tokens": 14681393.0,
991
+ "step": 1090
992
+ },
993
+ {
994
+ "epoch": 0.6699147381242387,
995
+ "grad_norm": 0.5369830131530762,
996
+ "learning_rate": 0.00018297119723333877,
997
+ "loss": 0.765,
998
+ "mean_token_accuracy": 0.7950262635946274,
999
+ "num_tokens": 14814565.0,
1000
+ "step": 1100
1001
+ },
1002
+ {
1003
+ "epoch": 0.6760048721071864,
1004
+ "grad_norm": 0.5289803743362427,
1005
+ "learning_rate": 0.00018262324365372846,
1006
+ "loss": 0.7496,
1007
+ "mean_token_accuracy": 0.8032818242907525,
1008
+ "num_tokens": 14954351.0,
1009
+ "step": 1110
1010
+ },
1011
+ {
1012
+ "epoch": 0.682095006090134,
1013
+ "grad_norm": 0.5440439581871033,
1014
+ "learning_rate": 0.0001822721504219814,
1015
+ "loss": 0.7432,
1016
+ "mean_token_accuracy": 0.799126236140728,
1017
+ "num_tokens": 15094879.0,
1018
+ "step": 1120
1019
+ },
1020
+ {
1021
+ "epoch": 0.6881851400730816,
1022
+ "grad_norm": 0.46225935220718384,
1023
+ "learning_rate": 0.00018191793271657978,
1024
+ "loss": 0.7513,
1025
+ "mean_token_accuracy": 0.8022688791155815,
1026
+ "num_tokens": 15234906.0,
1027
+ "step": 1130
1028
+ },
1029
+ {
1030
+ "epoch": 0.6942752740560292,
1031
+ "grad_norm": 0.5592020750045776,
1032
+ "learning_rate": 0.0001815606058510833,
1033
+ "loss": 0.7583,
1034
+ "mean_token_accuracy": 0.7984497547149658,
1035
+ "num_tokens": 15373526.0,
1036
+ "step": 1140
1037
+ },
1038
+ {
1039
+ "epoch": 0.7003654080389768,
1040
+ "grad_norm": 0.525090217590332,
1041
+ "learning_rate": 0.00018120018527346702,
1042
+ "loss": 0.7254,
1043
+ "mean_token_accuracy": 0.8070619881153107,
1044
+ "num_tokens": 15516264.0,
1045
+ "step": 1150
1046
+ },
1047
+ {
1048
+ "epoch": 0.7064555420219245,
1049
+ "grad_norm": 0.5380759239196777,
1050
+ "learning_rate": 0.00018083668656545355,
1051
+ "loss": 0.8041,
1052
+ "mean_token_accuracy": 0.7866759791970253,
1053
+ "num_tokens": 15640444.0,
1054
+ "step": 1160
1055
+ },
1056
+ {
1057
+ "epoch": 0.7125456760048721,
1058
+ "grad_norm": 0.47815701365470886,
1059
+ "learning_rate": 0.00018047012544183938,
1060
+ "loss": 0.7604,
1061
+ "mean_token_accuracy": 0.796156468987465,
1062
+ "num_tokens": 15778070.0,
1063
+ "step": 1170
1064
+ },
1065
+ {
1066
+ "epoch": 0.7186358099878197,
1067
+ "grad_norm": 0.5380450487136841,
1068
+ "learning_rate": 0.00018010051774981553,
1069
+ "loss": 0.8135,
1070
+ "mean_token_accuracy": 0.7842124432325364,
1071
+ "num_tokens": 15899739.0,
1072
+ "step": 1180
1073
+ },
1074
+ {
1075
+ "epoch": 0.7247259439707674,
1076
+ "grad_norm": 0.5047502517700195,
1077
+ "learning_rate": 0.00017972787946828246,
1078
+ "loss": 0.7642,
1079
+ "mean_token_accuracy": 0.7989341139793396,
1080
+ "num_tokens": 16035805.0,
1081
+ "step": 1190
1082
+ },
1083
+ {
1084
+ "epoch": 0.730816077953715,
1085
+ "grad_norm": 0.5440967679023743,
1086
+ "learning_rate": 0.00017935222670715918,
1087
+ "loss": 0.735,
1088
+ "mean_token_accuracy": 0.8048294603824615,
1089
+ "num_tokens": 16172541.0,
1090
+ "step": 1200
1091
+ },
1092
+ {
1093
+ "epoch": 0.7369062119366626,
1094
+ "grad_norm": 0.4766077399253845,
1095
+ "learning_rate": 0.000178973575706687,
1096
+ "loss": 0.805,
1097
+ "mean_token_accuracy": 0.7871790423989296,
1098
+ "num_tokens": 16296988.0,
1099
+ "step": 1210
1100
+ },
1101
+ {
1102
+ "epoch": 0.7429963459196103,
1103
+ "grad_norm": 0.4153214991092682,
1104
+ "learning_rate": 0.00017859194283672704,
1105
+ "loss": 0.7635,
1106
+ "mean_token_accuracy": 0.7964595645666123,
1107
+ "num_tokens": 16432022.0,
1108
+ "step": 1220
1109
+ },
1110
+ {
1111
+ "epoch": 0.7490864799025578,
1112
+ "grad_norm": 0.4698518216609955,
1113
+ "learning_rate": 0.00017820734459605302,
1114
+ "loss": 0.7397,
1115
+ "mean_token_accuracy": 0.8046972885727882,
1116
+ "num_tokens": 16572880.0,
1117
+ "step": 1230
1118
+ },
1119
+ {
1120
+ "epoch": 0.7551766138855055,
1121
+ "grad_norm": 0.46101540327072144,
1122
+ "learning_rate": 0.00017781979761163756,
1123
+ "loss": 0.7174,
1124
+ "mean_token_accuracy": 0.8066875368356705,
1125
+ "num_tokens": 16714419.0,
1126
+ "step": 1240
1127
+ },
1128
+ {
1129
+ "epoch": 0.761266747868453,
1130
+ "grad_norm": 0.5313341021537781,
1131
+ "learning_rate": 0.00017742931863793358,
1132
+ "loss": 0.7797,
1133
+ "mean_token_accuracy": 0.7911526098847389,
1134
+ "num_tokens": 16838285.0,
1135
+ "step": 1250
1136
+ },
1137
+ {
1138
+ "epoch": 0.7673568818514007,
1139
+ "grad_norm": 0.4627362787723541,
1140
+ "learning_rate": 0.00017703592455614998,
1141
+ "loss": 0.7626,
1142
+ "mean_token_accuracy": 0.7970306649804115,
1143
+ "num_tokens": 16976065.0,
1144
+ "step": 1260
1145
+ },
1146
+ {
1147
+ "epoch": 0.7734470158343484,
1148
+ "grad_norm": 0.5429073572158813,
1149
+ "learning_rate": 0.00017663963237352177,
1150
+ "loss": 0.7398,
1151
+ "mean_token_accuracy": 0.8005403786897659,
1152
+ "num_tokens": 17112901.0,
1153
+ "step": 1270
1154
+ },
1155
+ {
1156
+ "epoch": 0.7795371498172959,
1157
+ "grad_norm": 0.6781270503997803,
1158
+ "learning_rate": 0.00017624045922257471,
1159
+ "loss": 0.7607,
1160
+ "mean_token_accuracy": 0.7946217939257622,
1161
+ "num_tokens": 17245480.0,
1162
+ "step": 1280
1163
+ },
1164
+ {
1165
+ "epoch": 0.7856272838002436,
1166
+ "grad_norm": 0.5227305293083191,
1167
+ "learning_rate": 0.00017583842236038483,
1168
+ "loss": 0.7217,
1169
+ "mean_token_accuracy": 0.8064659267663956,
1170
+ "num_tokens": 17387171.0,
1171
+ "step": 1290
1172
+ },
1173
+ {
1174
+ "epoch": 0.7917174177831913,
1175
+ "grad_norm": 0.49253156781196594,
1176
+ "learning_rate": 0.0001754335391678323,
1177
+ "loss": 0.7652,
1178
+ "mean_token_accuracy": 0.7960015773773194,
1179
+ "num_tokens": 17521164.0,
1180
+ "step": 1300
1181
+ },
1182
+ {
1183
+ "epoch": 0.7978075517661388,
1184
+ "grad_norm": 0.5103631615638733,
1185
+ "learning_rate": 0.00017502582714884997,
1186
+ "loss": 0.7435,
1187
+ "mean_token_accuracy": 0.7995276898145676,
1188
+ "num_tokens": 17657818.0,
1189
+ "step": 1310
1190
+ },
1191
+ {
1192
+ "epoch": 0.8038976857490865,
1193
+ "grad_norm": 0.5531247854232788,
1194
+ "learning_rate": 0.00017461530392966665,
1195
+ "loss": 0.7986,
1196
+ "mean_token_accuracy": 0.7892467245459557,
1197
+ "num_tokens": 17784361.0,
1198
+ "step": 1320
1199
+ },
1200
+ {
1201
+ "epoch": 0.8099878197320342,
1202
+ "grad_norm": 0.4574586749076843,
1203
+ "learning_rate": 0.00017420198725804517,
1204
+ "loss": 0.6889,
1205
+ "mean_token_accuracy": 0.8135112956166267,
1206
+ "num_tokens": 17929664.0,
1207
+ "step": 1330
1208
+ },
1209
+ {
1210
+ "epoch": 0.8160779537149817,
1211
+ "grad_norm": 0.4734383225440979,
1212
+ "learning_rate": 0.00017378589500251498,
1213
+ "loss": 0.7308,
1214
+ "mean_token_accuracy": 0.8029947131872177,
1215
+ "num_tokens": 18071182.0,
1216
+ "step": 1340
1217
+ },
1218
+ {
1219
+ "epoch": 0.8221680876979294,
1220
+ "grad_norm": 0.5192279815673828,
1221
+ "learning_rate": 0.00017336704515159986,
1222
+ "loss": 0.7444,
1223
+ "mean_token_accuracy": 0.8012512847781181,
1224
+ "num_tokens": 18211136.0,
1225
+ "step": 1350
1226
+ },
1227
+ {
1228
+ "epoch": 0.8282582216808769,
1229
+ "grad_norm": 0.5378620624542236,
1230
+ "learning_rate": 0.00017294545581303996,
1231
+ "loss": 0.7459,
1232
+ "mean_token_accuracy": 0.7981989249587059,
1233
+ "num_tokens": 18340645.0,
1234
+ "step": 1360
1235
+ },
1236
+ {
1237
+ "epoch": 0.8343483556638246,
1238
+ "grad_norm": 0.4879571497440338,
1239
+ "learning_rate": 0.00017252114521300918,
1240
+ "loss": 0.7877,
1241
+ "mean_token_accuracy": 0.7891893342137337,
1242
+ "num_tokens": 18465733.0,
1243
+ "step": 1370
1244
+ },
1245
+ {
1246
+ "epoch": 0.8404384896467723,
1247
+ "grad_norm": 0.5297388434410095,
1248
+ "learning_rate": 0.00017209413169532717,
1249
+ "loss": 0.7586,
1250
+ "mean_token_accuracy": 0.797142505645752,
1251
+ "num_tokens": 18598979.0,
1252
+ "step": 1380
1253
+ },
1254
+ {
1255
+ "epoch": 0.8465286236297198,
1256
+ "grad_norm": 0.5308396220207214,
1257
+ "learning_rate": 0.00017166443372066618,
1258
+ "loss": 0.7387,
1259
+ "mean_token_accuracy": 0.80123979896307,
1260
+ "num_tokens": 18735919.0,
1261
+ "step": 1390
1262
+ },
1263
+ {
1264
+ "epoch": 0.8526187576126675,
1265
+ "grad_norm": 0.49988579750061035,
1266
+ "learning_rate": 0.0001712320698657532,
1267
+ "loss": 0.7425,
1268
+ "mean_token_accuracy": 0.7996803268790245,
1269
+ "num_tokens": 18870877.0,
1270
+ "step": 1400
1271
+ },
1272
+ {
1273
+ "epoch": 0.8587088915956151,
1274
+ "grad_norm": 0.5971361994743347,
1275
+ "learning_rate": 0.0001707970588225665,
1276
+ "loss": 0.7691,
1277
+ "mean_token_accuracy": 0.7922965154051781,
1278
+ "num_tokens": 19000943.0,
1279
+ "step": 1410
1280
+ },
1281
+ {
1282
+ "epoch": 0.8647990255785627,
1283
+ "grad_norm": 0.5141698718070984,
1284
+ "learning_rate": 0.00017035941939752802,
1285
+ "loss": 0.7203,
1286
+ "mean_token_accuracy": 0.8036229625344277,
1287
+ "num_tokens": 19135039.0,
1288
+ "step": 1420
1289
+ },
1290
+ {
1291
+ "epoch": 0.8708891595615104,
1292
+ "grad_norm": 0.4647749066352844,
1293
+ "learning_rate": 0.0001699191705106898,
1294
+ "loss": 0.7136,
1295
+ "mean_token_accuracy": 0.8064323276281357,
1296
+ "num_tokens": 19274069.0,
1297
+ "step": 1430
1298
+ },
1299
+ {
1300
+ "epoch": 0.876979293544458,
1301
+ "grad_norm": 0.5511934161186218,
1302
+ "learning_rate": 0.00016947633119491633,
1303
+ "loss": 0.7455,
1304
+ "mean_token_accuracy": 0.7985599264502525,
1305
+ "num_tokens": 19409679.0,
1306
+ "step": 1440
1307
+ },
1308
+ {
1309
+ "epoch": 0.8830694275274056,
1310
+ "grad_norm": 0.4936945140361786,
1311
+ "learning_rate": 0.00016903092059506182,
1312
+ "loss": 0.7087,
1313
+ "mean_token_accuracy": 0.806523185968399,
1314
+ "num_tokens": 19547419.0,
1315
+ "step": 1450
1316
+ },
1317
+ {
1318
+ "epoch": 0.8891595615103532,
1319
+ "grad_norm": 0.5227787494659424,
1320
+ "learning_rate": 0.00016858295796714213,
1321
+ "loss": 0.7739,
1322
+ "mean_token_accuracy": 0.7941467314958572,
1323
+ "num_tokens": 19674455.0,
1324
+ "step": 1460
1325
+ },
1326
+ {
1327
+ "epoch": 0.8952496954933008,
1328
+ "grad_norm": 0.5046219825744629,
1329
+ "learning_rate": 0.00016813246267750282,
1330
+ "loss": 0.7361,
1331
+ "mean_token_accuracy": 0.8008369222283364,
1332
+ "num_tokens": 19809861.0,
1333
+ "step": 1470
1334
+ },
1335
+ {
1336
+ "epoch": 0.9013398294762485,
1337
+ "grad_norm": 0.4827081263065338,
1338
+ "learning_rate": 0.00016767945420198142,
1339
+ "loss": 0.7464,
1340
+ "mean_token_accuracy": 0.7986427888274192,
1341
+ "num_tokens": 19940696.0,
1342
+ "step": 1480
1343
+ },
1344
+ {
1345
+ "epoch": 0.9074299634591961,
1346
+ "grad_norm": 0.4970889687538147,
1347
+ "learning_rate": 0.00016722395212506567,
1348
+ "loss": 0.7528,
1349
+ "mean_token_accuracy": 0.7965970665216446,
1350
+ "num_tokens": 20070686.0,
1351
+ "step": 1490
1352
+ },
1353
+ {
1354
+ "epoch": 0.9135200974421437,
1355
+ "grad_norm": 0.44478070735931396,
1356
+ "learning_rate": 0.00016676597613904693,
1357
+ "loss": 0.7185,
1358
+ "mean_token_accuracy": 0.8081388726830483,
1359
+ "num_tokens": 20210260.0,
1360
+ "step": 1500
1361
+ },
1362
+ {
1363
+ "epoch": 0.9196102314250914,
1364
+ "grad_norm": 0.506136417388916,
1365
+ "learning_rate": 0.00016630554604316866,
1366
+ "loss": 0.7395,
1367
+ "mean_token_accuracy": 0.8003876298666001,
1368
+ "num_tokens": 20346235.0,
1369
+ "step": 1510
1370
+ },
1371
+ {
1372
+ "epoch": 0.925700365408039,
1373
+ "grad_norm": 0.500946044921875,
1374
+ "learning_rate": 0.00016584268174277053,
1375
+ "loss": 0.6889,
1376
+ "mean_token_accuracy": 0.8124501362442971,
1377
+ "num_tokens": 20481248.0,
1378
+ "step": 1520
1379
+ },
1380
+ {
1381
+ "epoch": 0.9317904993909866,
1382
+ "grad_norm": 0.48528990149497986,
1383
+ "learning_rate": 0.00016537740324842795,
1384
+ "loss": 0.7227,
1385
+ "mean_token_accuracy": 0.8041250064969063,
1386
+ "num_tokens": 20613531.0,
1387
+ "step": 1530
1388
+ },
1389
+ {
1390
+ "epoch": 0.9378806333739342,
1391
+ "grad_norm": 0.5070951581001282,
1392
+ "learning_rate": 0.00016490973067508674,
1393
+ "loss": 0.7091,
1394
+ "mean_token_accuracy": 0.8082544595003128,
1395
+ "num_tokens": 20750784.0,
1396
+ "step": 1540
1397
+ },
1398
+ {
1399
+ "epoch": 0.9439707673568819,
1400
+ "grad_norm": 0.5583120584487915,
1401
+ "learning_rate": 0.0001644396842411939,
1402
+ "loss": 0.7405,
1403
+ "mean_token_accuracy": 0.7992320343852043,
1404
+ "num_tokens": 20883646.0,
1405
+ "step": 1550
1406
+ },
1407
+ {
1408
+ "epoch": 0.9500609013398295,
1409
+ "grad_norm": 0.5099635124206543,
1410
+ "learning_rate": 0.00016396728426782312,
1411
+ "loss": 0.7103,
1412
+ "mean_token_accuracy": 0.8091216519474983,
1413
+ "num_tokens": 21025143.0,
1414
+ "step": 1560
1415
+ },
1416
+ {
1417
+ "epoch": 0.9561510353227771,
1418
+ "grad_norm": 0.5777808427810669,
1419
+ "learning_rate": 0.00016349255117779652,
1420
+ "loss": 0.7245,
1421
+ "mean_token_accuracy": 0.8023119494318962,
1422
+ "num_tokens": 21160014.0,
1423
+ "step": 1570
1424
+ },
1425
+ {
1426
+ "epoch": 0.9622411693057247,
1427
+ "grad_norm": 0.5206162333488464,
1428
+ "learning_rate": 0.0001630155054948016,
1429
+ "loss": 0.7185,
1430
+ "mean_token_accuracy": 0.8069521963596344,
1431
+ "num_tokens": 21299094.0,
1432
+ "step": 1580
1433
+ },
1434
+ {
1435
+ "epoch": 0.9683313032886723,
1436
+ "grad_norm": 0.5763202905654907,
1437
+ "learning_rate": 0.00016253616784250415,
1438
+ "loss": 0.7677,
1439
+ "mean_token_accuracy": 0.7927820891141891,
1440
+ "num_tokens": 21429252.0,
1441
+ "step": 1590
1442
+ },
1443
+ {
1444
+ "epoch": 0.97442143727162,
1445
+ "grad_norm": 0.5068426728248596,
1446
+ "learning_rate": 0.00016205455894365627,
1447
+ "loss": 0.7673,
1448
+ "mean_token_accuracy": 0.794715291261673,
1449
+ "num_tokens": 21556200.0,
1450
+ "step": 1600
1451
+ },
1452
+ {
1453
+ "epoch": 0.9805115712545676,
1454
+ "grad_norm": 0.46094459295272827,
1455
+ "learning_rate": 0.0001615706996192009,
1456
+ "loss": 0.771,
1457
+ "mean_token_accuracy": 0.7921045809984207,
1458
+ "num_tokens": 21681524.0,
1459
+ "step": 1610
1460
+ },
1461
+ {
1462
+ "epoch": 0.9866017052375152,
1463
+ "grad_norm": 0.5063546299934387,
1464
+ "learning_rate": 0.00016108461078737148,
1465
+ "loss": 0.7383,
1466
+ "mean_token_accuracy": 0.800596435368061,
1467
+ "num_tokens": 21814109.0,
1468
+ "step": 1620
1469
+ },
1470
+ {
1471
+ "epoch": 0.9926918392204629,
1472
+ "grad_norm": 0.5418652296066284,
1473
+ "learning_rate": 0.0001605963134627876,
1474
+ "loss": 0.7431,
1475
+ "mean_token_accuracy": 0.7994748756289483,
1476
+ "num_tokens": 21947346.0,
1477
+ "step": 1630
1478
+ },
1479
+ {
1480
+ "epoch": 0.9987819732034104,
1481
+ "grad_norm": 0.6195595264434814,
1482
+ "learning_rate": 0.0001601058287555465,
1483
+ "loss": 0.7294,
1484
+ "mean_token_accuracy": 0.8030684441328049,
1485
+ "num_tokens": 22081340.0,
1486
+ "step": 1640
1487
+ }
1488
+ ],
1489
+ "logging_steps": 10,
1490
+ "max_steps": 4926,
1491
+ "num_input_tokens_seen": 0,
1492
+ "num_train_epochs": 3,
1493
+ "save_steps": 500,
1494
+ "stateful_callbacks": {
1495
+ "TrainerControl": {
1496
+ "args": {
1497
+ "should_epoch_stop": false,
1498
+ "should_evaluate": false,
1499
+ "should_log": false,
1500
+ "should_save": true,
1501
+ "should_training_stop": false
1502
+ },
1503
+ "attributes": {}
1504
+ }
1505
+ },
1506
+ "total_flos": 2.6993952090530775e+18,
1507
+ "train_batch_size": 1,
1508
+ "trial_name": null,
1509
+ "trial_params": null
1510
+ }
checkpoint-1642/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d57fe99d74b7e16ba38edb5265078ef5a69a65f6b630b2ca3feaacdb770f49e
3
+ size 6161
checkpoint-3284/README.md ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: openai/gpt-oss-20b
3
+ library_name: peft
4
+ tags:
5
+ - base_model:adapter:openai/gpt-oss-20b
6
+ - lora
7
+ - sft
8
+ - transformers
9
+ - trl
10
+ ---
11
+
12
+ # Model Card for Model ID
13
+
14
+ <!-- Provide a quick summary of what the model is/does. -->
15
+
16
+
17
+
18
+ ## Model Details
19
+
20
+ ### Model Description
21
+
22
+ <!-- Provide a longer summary of what this model is. -->
23
+
24
+
25
+
26
+ - **Developed by:** [More Information Needed]
27
+ - **Funded by [optional]:** [More Information Needed]
28
+ - **Shared by [optional]:** [More Information Needed]
29
+ - **Model type:** [More Information Needed]
30
+ - **Language(s) (NLP):** [More Information Needed]
31
+ - **License:** [More Information Needed]
32
+ - **Finetuned from model [optional]:** [More Information Needed]
33
+
34
+ ### Model Sources [optional]
35
+
36
+ <!-- Provide the basic links for the model. -->
37
+
38
+ - **Repository:** [More Information Needed]
39
+ - **Paper [optional]:** [More Information Needed]
40
+ - **Demo [optional]:** [More Information Needed]
41
+
42
+ ## Uses
43
+
44
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
45
+
46
+ ### Direct Use
47
+
48
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Downstream Use [optional]
53
+
54
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
55
+
56
+ [More Information Needed]
57
+
58
+ ### Out-of-Scope Use
59
+
60
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ## Bias, Risks, and Limitations
65
+
66
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
67
+
68
+ [More Information Needed]
69
+
70
+ ### Recommendations
71
+
72
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
73
+
74
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
75
+
76
+ ## How to Get Started with the Model
77
+
78
+ Use the code below to get started with the model.
79
+
80
+ [More Information Needed]
81
+
82
+ ## Training Details
83
+
84
+ ### Training Data
85
+
86
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
87
+
88
+ [More Information Needed]
89
+
90
+ ### Training Procedure
91
+
92
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
93
+
94
+ #### Preprocessing [optional]
95
+
96
+ [More Information Needed]
97
+
98
+
99
+ #### Training Hyperparameters
100
+
101
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
102
+
103
+ #### Speeds, Sizes, Times [optional]
104
+
105
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
106
+
107
+ [More Information Needed]
108
+
109
+ ## Evaluation
110
+
111
+ <!-- This section describes the evaluation protocols and provides the results. -->
112
+
113
+ ### Testing Data, Factors & Metrics
114
+
115
+ #### Testing Data
116
+
117
+ <!-- This should link to a Dataset Card if possible. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Factors
122
+
123
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
124
+
125
+ [More Information Needed]
126
+
127
+ #### Metrics
128
+
129
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
130
+
131
+ [More Information Needed]
132
+
133
+ ### Results
134
+
135
+ [More Information Needed]
136
+
137
+ #### Summary
138
+
139
+
140
+
141
+ ## Model Examination [optional]
142
+
143
+ <!-- Relevant interpretability work for the model goes here -->
144
+
145
+ [More Information Needed]
146
+
147
+ ## Environmental Impact
148
+
149
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
150
+
151
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
152
+
153
+ - **Hardware Type:** [More Information Needed]
154
+ - **Hours used:** [More Information Needed]
155
+ - **Cloud Provider:** [More Information Needed]
156
+ - **Compute Region:** [More Information Needed]
157
+ - **Carbon Emitted:** [More Information Needed]
158
+
159
+ ## Technical Specifications [optional]
160
+
161
+ ### Model Architecture and Objective
162
+
163
+ [More Information Needed]
164
+
165
+ ### Compute Infrastructure
166
+
167
+ [More Information Needed]
168
+
169
+ #### Hardware
170
+
171
+ [More Information Needed]
172
+
173
+ #### Software
174
+
175
+ [More Information Needed]
176
+
177
+ ## Citation [optional]
178
+
179
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
180
+
181
+ **BibTeX:**
182
+
183
+ [More Information Needed]
184
+
185
+ **APA:**
186
+
187
+ [More Information Needed]
188
+
189
+ ## Glossary [optional]
190
+
191
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
192
+
193
+ [More Information Needed]
194
+
195
+ ## More Information [optional]
196
+
197
+ [More Information Needed]
198
+
199
+ ## Model Card Authors [optional]
200
+
201
+ [More Information Needed]
202
+
203
+ ## Model Card Contact
204
+
205
+ [More Information Needed]
206
+ ### Framework versions
207
+
208
+ - PEFT 0.17.1
checkpoint-3284/adapter_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "GptOssForCausalLM",
5
+ "parent_library": "transformers.models.gpt_oss.modeling_gpt_oss"
6
+ },
7
+ "base_model_name_or_path": "openai/gpt-oss-20b",
8
+ "bias": "none",
9
+ "corda_config": null,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 16,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.0,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "qalora_group_size": 16,
27
+ "r": 8,
28
+ "rank_pattern": {},
29
+ "revision": null,
30
+ "target_modules": [
31
+ "o_proj",
32
+ "k_proj",
33
+ "v_proj",
34
+ "q_proj"
35
+ ],
36
+ "target_parameters": [
37
+ "7.mlp.experts.gate_up_proj",
38
+ "7.mlp.experts.down_proj",
39
+ "15.mlp.experts.gate_up_proj",
40
+ "15.mlp.experts.down_proj",
41
+ "23.mlp.experts.gate_up_proj",
42
+ "23.mlp.experts.down_proj"
43
+ ],
44
+ "task_type": null,
45
+ "trainable_token_indices": null,
46
+ "use_dora": false,
47
+ "use_qalora": false,
48
+ "use_rslora": false
49
+ }
checkpoint-3284/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:863cffb057e314cefc4b79ade1f0ec14ceffa2ba036738faf8f97bd97cd0ceba
3
+ size 2366470368
checkpoint-3284/chat_template.jinja ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#-
2
+ In addition to the normal inputs of `messages` and `tools`, this template also accepts the
3
+ following kwargs:
4
+ - "builtin_tools": A list, can contain "browser" and/or "python".
5
+ - "model_identity": A string that optionally describes the model identity.
6
+ - "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
7
+ #}
8
+
9
+ {#- Tool Definition Rendering ============================================== #}
10
+ {%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}
11
+ {%- if param_spec.type == "array" -%}
12
+ {%- if param_spec['items'] -%}
13
+ {%- if param_spec['items']['type'] == "string" -%}
14
+ {{- "string[]" }}
15
+ {%- elif param_spec['items']['type'] == "number" -%}
16
+ {{- "number[]" }}
17
+ {%- elif param_spec['items']['type'] == "integer" -%}
18
+ {{- "number[]" }}
19
+ {%- elif param_spec['items']['type'] == "boolean" -%}
20
+ {{- "boolean[]" }}
21
+ {%- else -%}
22
+ {%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
23
+ {%- if inner_type == "object | object" or inner_type|length > 50 -%}
24
+ {{- "any[]" }}
25
+ {%- else -%}
26
+ {{- inner_type + "[]" }}
27
+ {%- endif -%}
28
+ {%- endif -%}
29
+ {%- if param_spec.nullable -%}
30
+ {{- " | null" }}
31
+ {%- endif -%}
32
+ {%- else -%}
33
+ {{- "any[]" }}
34
+ {%- if param_spec.nullable -%}
35
+ {{- " | null" }}
36
+ {%- endif -%}
37
+ {%- endif -%}
38
+ {%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
39
+ {#- Handle array of types like ["object", "object"] from Union[dict, list] #}
40
+ {%- if param_spec.type | length > 1 -%}
41
+ {{- param_spec.type | join(" | ") }}
42
+ {%- else -%}
43
+ {{- param_spec.type[0] }}
44
+ {%- endif -%}
45
+ {%- elif param_spec.oneOf -%}
46
+ {#- Handle oneOf schemas - check for complex unions and fallback to any #}
47
+ {%- set has_object_variants = false -%}
48
+ {%- for variant in param_spec.oneOf -%}
49
+ {%- if variant.type == "object" -%}
50
+ {%- set has_object_variants = true -%}
51
+ {%- endif -%}
52
+ {%- endfor -%}
53
+ {%- if has_object_variants and param_spec.oneOf|length > 1 -%}
54
+ {{- "any" }}
55
+ {%- else -%}
56
+ {%- for variant in param_spec.oneOf -%}
57
+ {{- render_typescript_type(variant, required_params) -}}
58
+ {%- if variant.description %}
59
+ {{- "// " + variant.description }}
60
+ {%- endif -%}
61
+ {%- if variant.default is defined %}
62
+ {{ "// default: " + variant.default|tojson }}
63
+ {%- endif -%}
64
+ {%- if not loop.last %}
65
+ {{- " | " }}
66
+ {% endif -%}
67
+ {%- endfor -%}
68
+ {%- endif -%}
69
+ {%- elif param_spec.type == "string" -%}
70
+ {%- if param_spec.enum -%}
71
+ {{- '"' + param_spec.enum|join('" | "') + '"' -}}
72
+ {%- else -%}
73
+ {{- "string" }}
74
+ {%- if param_spec.nullable %}
75
+ {{- " | null" }}
76
+ {%- endif -%}
77
+ {%- endif -%}
78
+ {%- elif param_spec.type == "number" -%}
79
+ {{- "number" }}
80
+ {%- elif param_spec.type == "integer" -%}
81
+ {{- "number" }}
82
+ {%- elif param_spec.type == "boolean" -%}
83
+ {{- "boolean" }}
84
+
85
+ {%- elif param_spec.type == "object" -%}
86
+ {%- if param_spec.properties -%}
87
+ {{- "{\n" }}
88
+ {%- for prop_name, prop_spec in param_spec.properties.items() -%}
89
+ {{- prop_name -}}
90
+ {%- if prop_name not in (param_spec.required or []) -%}
91
+ {{- "?" }}
92
+ {%- endif -%}
93
+ {{- ": " }}
94
+ {{ render_typescript_type(prop_spec, param_spec.required or []) }}
95
+ {%- if not loop.last -%}
96
+ {{-", " }}
97
+ {%- endif -%}
98
+ {%- endfor -%}
99
+ {{- "}" }}
100
+ {%- else -%}
101
+ {{- "object" }}
102
+ {%- endif -%}
103
+ {%- else -%}
104
+ {{- "any" }}
105
+ {%- endif -%}
106
+ {%- endmacro -%}
107
+
108
+ {%- macro render_tool_namespace(namespace_name, tools) -%}
109
+ {{- "## " + namespace_name + "\n\n" }}
110
+ {{- "namespace " + namespace_name + " {\n\n" }}
111
+ {%- for tool in tools %}
112
+ {%- set tool = tool.function %}
113
+ {{- "// " + tool.description + "\n" }}
114
+ {{- "type "+ tool.name + " = " }}
115
+ {%- if tool.parameters and tool.parameters.properties %}
116
+ {{- "(_: {\n" }}
117
+ {%- for param_name, param_spec in tool.parameters.properties.items() %}
118
+ {%- if param_spec.description %}
119
+ {{- "// " + param_spec.description + "\n" }}
120
+ {%- endif %}
121
+ {{- param_name }}
122
+ {%- if param_name not in (tool.parameters.required or []) -%}
123
+ {{- "?" }}
124
+ {%- endif -%}
125
+ {{- ": " }}
126
+ {{- render_typescript_type(param_spec, tool.parameters.required or []) }}
127
+ {%- if param_spec.default is defined -%}
128
+ {%- if param_spec.enum %}
129
+ {{- ", // default: " + param_spec.default }}
130
+ {%- elif param_spec.oneOf %}
131
+ {{- "// default: " + param_spec.default }}
132
+ {%- else %}
133
+ {{- ", // default: " + param_spec.default|tojson }}
134
+ {%- endif -%}
135
+ {%- endif -%}
136
+ {%- if not loop.last %}
137
+ {{- ",\n" }}
138
+ {%- else %}
139
+ {{- ",\n" }}
140
+ {%- endif -%}
141
+ {%- endfor %}
142
+ {{- "}) => any;\n\n" }}
143
+ {%- else -%}
144
+ {{- "() => any;\n\n" }}
145
+ {%- endif -%}
146
+ {%- endfor %}
147
+ {{- "} // namespace " + namespace_name }}
148
+ {%- endmacro -%}
149
+
150
+ {%- macro render_builtin_tools(browser_tool, python_tool) -%}
151
+ {%- if browser_tool %}
152
+ {{- "## browser\n\n" }}
153
+ {{- "// Tool for browsing.\n" }}
154
+ {{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
155
+ {{- "// Cite information from the tool using the following format:\n" }}
156
+ {{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
157
+ {{- "// Do not quote more than 10 words directly from the tool output.\n" }}
158
+ {{- "// sources=web (default: web)\n" }}
159
+ {{- "namespace browser {\n\n" }}
160
+ {{- "// Searches for information related to `query` and displays `topn` results.\n" }}
161
+ {{- "type search = (_: {\n" }}
162
+ {{- "query: string,\n" }}
163
+ {{- "topn?: number, // default: 10\n" }}
164
+ {{- "source?: string,\n" }}
165
+ {{- "}) => any;\n\n" }}
166
+ {{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
167
+ {{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
168
+ {{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
169
+ {{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
170
+ {{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
171
+ {{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
172
+ {{- "type open = (_: {\n" }}
173
+ {{- "id?: number | string, // default: -1\n" }}
174
+ {{- "cursor?: number, // default: -1\n" }}
175
+ {{- "loc?: number, // default: -1\n" }}
176
+ {{- "num_lines?: number, // default: -1\n" }}
177
+ {{- "view_source?: boolean, // default: false\n" }}
178
+ {{- "source?: string,\n" }}
179
+ {{- "}) => any;\n\n" }}
180
+ {{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
181
+ {{- "type find = (_: {\n" }}
182
+ {{- "pattern: string,\n" }}
183
+ {{- "cursor?: number, // default: -1\n" }}
184
+ {{- "}) => any;\n\n" }}
185
+ {{- "} // namespace browser\n\n" }}
186
+ {%- endif -%}
187
+
188
+ {%- if python_tool %}
189
+ {{- "## python\n\n" }}
190
+ {{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
191
+ {{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
192
+ {%- endif -%}
193
+ {%- endmacro -%}
194
+
195
+ {#- System Message Construction ============================================ #}
196
+ {%- macro build_system_message() -%}
197
+ {%- if model_identity is not defined %}
198
+ {%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
199
+ {%- endif %}
200
+ {{- model_identity + "\n" }}
201
+ {{- "Knowledge cutoff: 2024-06\n" }}
202
+ {{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}
203
+ {%- if reasoning_effort is not defined %}
204
+ {%- set reasoning_effort = "medium" %}
205
+ {%- endif %}
206
+ {{- "Reasoning: " + reasoning_effort + "\n\n" }}
207
+ {%- if builtin_tools %}
208
+ {{- "# Tools\n\n" }}
209
+ {%- set available_builtin_tools = namespace(browser=false, python=false) %}
210
+ {%- for tool in builtin_tools %}
211
+ {%- if tool == "browser" %}
212
+ {%- set available_builtin_tools.browser = true %}
213
+ {%- elif tool == "python" %}
214
+ {%- set available_builtin_tools.python = true %}
215
+ {%- endif %}
216
+ {%- endfor %}
217
+ {{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
218
+ {%- endif -%}
219
+ {{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
220
+ {%- if tools -%}
221
+ {{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
222
+ {%- endif -%}
223
+ {%- endmacro -%}
224
+
225
+ {#- Main Template Logic ================================================= #}
226
+ {#- Set defaults #}
227
+
228
+ {#- Render system message #}
229
+ {{- "<|start|>system<|message|>" }}
230
+ {{- build_system_message() }}
231
+ {{- "<|end|>" }}
232
+
233
+ {#- Extract developer message #}
234
+ {%- if messages[0].role == "developer" or messages[0].role == "system" %}
235
+ {%- set developer_message = messages[0].content %}
236
+ {%- set loop_messages = messages[1:] %}
237
+ {%- else %}
238
+ {%- set developer_message = "" %}
239
+ {%- set loop_messages = messages %}
240
+ {%- endif %}
241
+
242
+ {#- Render developer message #}
243
+ {%- if developer_message or tools %}
244
+ {{- "<|start|>developer<|message|>" }}
245
+ {%- if developer_message %}
246
+ {{- "# Instructions\n\n" }}
247
+ {{- developer_message }}
248
+ {{- "\n\n" }}
249
+ {%- endif %}
250
+ {%- if tools -%}
251
+ {{- "# Tools\n\n" }}
252
+ {{- render_tool_namespace("functions", tools) }}
253
+ {%- endif -%}
254
+ {{- "<|end|>" }}
255
+ {%- endif %}
256
+
257
+ {#- Render messages #}
258
+ {%- set last_tool_call = namespace(name=none) %}
259
+ {%- for message in loop_messages -%}
260
+ {#- At this point only assistant/user/tool messages should remain #}
261
+ {%- if message.role == 'assistant' -%}
262
+ {#- Checks to ensure the messages are being passed in the format we expect #}
263
+ {%- if "content" in message %}
264
+ {%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
265
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
266
+ {%- endif %}
267
+ {%- endif %}
268
+ {%- if "thinking" in message %}
269
+ {%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
270
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
271
+ {%- endif %}
272
+ {%- endif %}
273
+ {%- if "tool_calls" in message %}
274
+ {#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
275
+ {#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
276
+ {#- when we render CoT/analysis messages in inference. #}
277
+ {%- set future_final_message = namespace(found=false) %}
278
+ {%- for future_message in loop_messages[loop.index:] %}
279
+ {%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
280
+ {%- set future_final_message.found = true %}
281
+ {%- endif %}
282
+ {%- endfor %}
283
+ {#- We assume max 1 tool call per message, and so we infer the tool call name #}
284
+ {#- in "tool" messages from the most recent assistant tool call name #}
285
+ {%- set tool_call = message.tool_calls[0] %}
286
+ {%- if tool_call.function %}
287
+ {%- set tool_call = tool_call.function %}
288
+ {%- endif %}
289
+ {%- if message.content and message.thinking %}
290
+ {{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
291
+ {%- elif message.content and not future_final_message.found %}
292
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
293
+ {%- elif message.thinking and not future_final_message.found %}
294
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
295
+ {%- endif %}
296
+ {{- "<|start|>assistant to=" }}
297
+ {{- "functions." + tool_call.name + "<|channel|>commentary " }}
298
+ {{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
299
+ {{- tool_call.arguments|tojson }}
300
+ {{- "<|call|>" }}
301
+ {%- set last_tool_call.name = tool_call.name %}
302
+ {%- elif loop.last and not add_generation_prompt %}
303
+ {#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
304
+ {#- This is a situation that should only occur in training, never in inference. #}
305
+ {%- if "thinking" in message %}
306
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
307
+ {%- endif %}
308
+ {#- <|return|> indicates the end of generation, but <|end|> does not #}
309
+ {#- <|return|> should never be an input to the model, but we include it as the final token #}
310
+ {#- when training, so the model learns to emit it. #}
311
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
312
+ {%- else %}
313
+ {#- CoT is dropped during all previous turns, so we never render it for inference #}
314
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
315
+ {%- set last_tool_call.name = none %}
316
+ {%- endif %}
317
+ {%- elif message.role == 'tool' -%}
318
+ {%- if last_tool_call.name is none %}
319
+ {{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
320
+ {%- endif %}
321
+ {{- "<|start|>functions." + last_tool_call.name }}
322
+ {{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
323
+ {%- elif message.role == 'user' -%}
324
+ {{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
325
+ {%- endif -%}
326
+ {%- endfor -%}
327
+
328
+ {#- Generation prompt #}
329
+ {%- if add_generation_prompt -%}
330
+ <|start|>assistant
331
+ {%- endif -%}
checkpoint-3284/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f31431c1c610dd489524726e1e535570f80ad216979b4133ca46b6b1395c50c0
3
+ size 120495883
checkpoint-3284/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bfe1981024ef92f2da08a90c72c7c793d1cc9de1547abd2556c968be70232eb
3
+ size 16389
checkpoint-3284/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a35b845d476d830805793c3dcf8ac2daad87fec289bff3f7eda9e72fc374eda1
3
+ size 16389
checkpoint-3284/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03e9880996b01262a807d1ec3ebd91eee540e08130a14a45a4648731fd0d48a9
3
+ size 16389
checkpoint-3284/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee25c237d6fe62ec76adcf7daf899d7ed32eab5d1a5b447b911f4451c9a1b258
3
+ size 16389
checkpoint-3284/rng_state_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a6b31133f29a8fc0cb538aa807d6a403bd51939336bfd425cd3d122d8c5595c
3
+ size 16389
checkpoint-3284/rng_state_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a26c55b5c7fa0522b1d27b2c00a7ea77ad010f19a1321991165c5c972b8fa97a
3
+ size 16389
checkpoint-3284/rng_state_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a1a3cf85626196804f25a8293e22dc561bba068a70fb123e04afe4896c33972
3
+ size 16389
checkpoint-3284/rng_state_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28f87c1ee5f5db346c7b913137cbccd196eaf8ec5a4cf9f192418a3069269b49
3
+ size 16389
checkpoint-3284/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e9aa280844c8740ef7748b8e17553210dcb3a3e5062e357e0434caf53ebef75
3
+ size 1465
checkpoint-3284/special_tokens_map.json ADDED
@@ -0,0 +1,1817 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "AAD",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ {
11
+ "content": "AArch64",
12
+ "lstrip": false,
13
+ "normalized": false,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ {
18
+ "content": "ACL",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ {
25
+ "content": "AD",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ },
31
+ {
32
+ "content": "AES",
33
+ "lstrip": false,
34
+ "normalized": false,
35
+ "rstrip": false,
36
+ "single_word": false
37
+ },
38
+ {
39
+ "content": "AES256GCM",
40
+ "lstrip": false,
41
+ "normalized": false,
42
+ "rstrip": false,
43
+ "single_word": false
44
+ },
45
+ {
46
+ "content": "AESCBC",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false
51
+ },
52
+ {
53
+ "content": "AKE",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false
58
+ },
59
+ {
60
+ "content": "AON",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false
65
+ },
66
+ {
67
+ "content": "ASID",
68
+ "lstrip": false,
69
+ "normalized": false,
70
+ "rstrip": false,
71
+ "single_word": false
72
+ },
73
+ {
74
+ "content": "AXI",
75
+ "lstrip": false,
76
+ "normalized": false,
77
+ "rstrip": false,
78
+ "single_word": false
79
+ },
80
+ {
81
+ "content": "Acronym",
82
+ "lstrip": false,
83
+ "normalized": false,
84
+ "rstrip": false,
85
+ "single_word": false
86
+ },
87
+ {
88
+ "content": "AoU",
89
+ "lstrip": false,
90
+ "normalized": false,
91
+ "rstrip": false,
92
+ "single_word": false
93
+ },
94
+ {
95
+ "content": "AutoSar",
96
+ "lstrip": false,
97
+ "normalized": false,
98
+ "rstrip": false,
99
+ "single_word": false
100
+ },
101
+ {
102
+ "content": "BAM",
103
+ "lstrip": false,
104
+ "normalized": false,
105
+ "rstrip": false,
106
+ "single_word": false
107
+ },
108
+ {
109
+ "content": "BCH",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false
114
+ },
115
+ {
116
+ "content": "BIST",
117
+ "lstrip": false,
118
+ "normalized": false,
119
+ "rstrip": false,
120
+ "single_word": false
121
+ },
122
+ {
123
+ "content": "BOM",
124
+ "lstrip": false,
125
+ "normalized": false,
126
+ "rstrip": false,
127
+ "single_word": false
128
+ },
129
+ {
130
+ "content": "BPMP",
131
+ "lstrip": false,
132
+ "normalized": false,
133
+ "rstrip": false,
134
+ "single_word": false
135
+ },
136
+ {
137
+ "content": "BPS",
138
+ "lstrip": false,
139
+ "normalized": false,
140
+ "rstrip": false,
141
+ "single_word": false
142
+ },
143
+ {
144
+ "content": "BPU",
145
+ "lstrip": false,
146
+ "normalized": false,
147
+ "rstrip": false,
148
+ "single_word": false
149
+ },
150
+ {
151
+ "content": "BRBCT",
152
+ "lstrip": false,
153
+ "normalized": false,
154
+ "rstrip": false,
155
+ "single_word": false
156
+ },
157
+ {
158
+ "content": "BW",
159
+ "lstrip": false,
160
+ "normalized": false,
161
+ "rstrip": false,
162
+ "single_word": false
163
+ },
164
+ {
165
+ "content": "C2C",
166
+ "lstrip": false,
167
+ "normalized": false,
168
+ "rstrip": false,
169
+ "single_word": false
170
+ },
171
+ {
172
+ "content": "CA",
173
+ "lstrip": false,
174
+ "normalized": false,
175
+ "rstrip": false,
176
+ "single_word": false
177
+ },
178
+ {
179
+ "content": "CAN",
180
+ "lstrip": false,
181
+ "normalized": false,
182
+ "rstrip": false,
183
+ "single_word": false
184
+ },
185
+ {
186
+ "content": "CANFD",
187
+ "lstrip": false,
188
+ "normalized": false,
189
+ "rstrip": false,
190
+ "single_word": false
191
+ },
192
+ {
193
+ "content": "CAR",
194
+ "lstrip": false,
195
+ "normalized": false,
196
+ "rstrip": false,
197
+ "single_word": false
198
+ },
199
+ {
200
+ "content": "CAVP",
201
+ "lstrip": false,
202
+ "normalized": false,
203
+ "rstrip": false,
204
+ "single_word": false
205
+ },
206
+ {
207
+ "content": "CBB",
208
+ "lstrip": false,
209
+ "normalized": false,
210
+ "rstrip": false,
211
+ "single_word": false
212
+ },
213
+ {
214
+ "content": "CBC",
215
+ "lstrip": false,
216
+ "normalized": false,
217
+ "rstrip": false,
218
+ "single_word": false
219
+ },
220
+ {
221
+ "content": "CBR",
222
+ "lstrip": false,
223
+ "normalized": false,
224
+ "rstrip": false,
225
+ "single_word": false
226
+ },
227
+ {
228
+ "content": "CCM",
229
+ "lstrip": false,
230
+ "normalized": false,
231
+ "rstrip": false,
232
+ "single_word": false
233
+ },
234
+ {
235
+ "content": "CCPLEX",
236
+ "lstrip": false,
237
+ "normalized": false,
238
+ "rstrip": false,
239
+ "single_word": false
240
+ },
241
+ {
242
+ "content": "CCPLEX_L2",
243
+ "lstrip": false,
244
+ "normalized": false,
245
+ "rstrip": false,
246
+ "single_word": false
247
+ },
248
+ {
249
+ "content": "CCPLEX_MISC",
250
+ "lstrip": false,
251
+ "normalized": false,
252
+ "rstrip": false,
253
+ "single_word": false
254
+ },
255
+ {
256
+ "content": "CCPLEX_SCF",
257
+ "lstrip": false,
258
+ "normalized": false,
259
+ "rstrip": false,
260
+ "single_word": false
261
+ },
262
+ {
263
+ "content": "CDD",
264
+ "lstrip": false,
265
+ "normalized": false,
266
+ "rstrip": false,
267
+ "single_word": false
268
+ },
269
+ {
270
+ "content": "CIF",
271
+ "lstrip": false,
272
+ "normalized": false,
273
+ "rstrip": false,
274
+ "single_word": false
275
+ },
276
+ {
277
+ "content": "CMAC",
278
+ "lstrip": false,
279
+ "normalized": false,
280
+ "rstrip": false,
281
+ "single_word": false
282
+ },
283
+ {
284
+ "content": "CPE",
285
+ "lstrip": false,
286
+ "normalized": false,
287
+ "rstrip": false,
288
+ "single_word": false
289
+ },
290
+ {
291
+ "content": "CPU",
292
+ "lstrip": false,
293
+ "normalized": false,
294
+ "rstrip": false,
295
+ "single_word": false
296
+ },
297
+ {
298
+ "content": "CRC",
299
+ "lstrip": false,
300
+ "normalized": false,
301
+ "rstrip": false,
302
+ "single_word": false
303
+ },
304
+ {
305
+ "content": "CSI",
306
+ "lstrip": false,
307
+ "normalized": false,
308
+ "rstrip": false,
309
+ "single_word": false
310
+ },
311
+ {
312
+ "content": "CSP",
313
+ "lstrip": false,
314
+ "normalized": false,
315
+ "rstrip": false,
316
+ "single_word": false
317
+ },
318
+ {
319
+ "content": "CTR",
320
+ "lstrip": false,
321
+ "normalized": false,
322
+ "rstrip": false,
323
+ "single_word": false
324
+ },
325
+ {
326
+ "content": "CTXT",
327
+ "lstrip": false,
328
+ "normalized": false,
329
+ "rstrip": false,
330
+ "single_word": false
331
+ },
332
+ {
333
+ "content": "CV",
334
+ "lstrip": false,
335
+ "normalized": false,
336
+ "rstrip": false,
337
+ "single_word": false
338
+ },
339
+ {
340
+ "content": "DBB",
341
+ "lstrip": false,
342
+ "normalized": false,
343
+ "rstrip": false,
344
+ "single_word": false
345
+ },
346
+ {
347
+ "content": "DEP",
348
+ "lstrip": false,
349
+ "normalized": false,
350
+ "rstrip": false,
351
+ "single_word": false
352
+ },
353
+ {
354
+ "content": "DEV",
355
+ "lstrip": false,
356
+ "normalized": false,
357
+ "rstrip": false,
358
+ "single_word": false
359
+ },
360
+ {
361
+ "content": "DFA",
362
+ "lstrip": false,
363
+ "normalized": false,
364
+ "rstrip": false,
365
+ "single_word": false
366
+ },
367
+ {
368
+ "content": "DFT",
369
+ "lstrip": false,
370
+ "normalized": false,
371
+ "rstrip": false,
372
+ "single_word": false
373
+ },
374
+ {
375
+ "content": "DIP",
376
+ "lstrip": false,
377
+ "normalized": false,
378
+ "rstrip": false,
379
+ "single_word": false
380
+ },
381
+ {
382
+ "content": "DISPLAY",
383
+ "lstrip": false,
384
+ "normalized": false,
385
+ "rstrip": false,
386
+ "single_word": false
387
+ },
388
+ {
389
+ "content": "DLA",
390
+ "lstrip": false,
391
+ "normalized": false,
392
+ "rstrip": false,
393
+ "single_word": false
394
+ },
395
+ {
396
+ "content": "DMA",
397
+ "lstrip": false,
398
+ "normalized": false,
399
+ "rstrip": false,
400
+ "single_word": false
401
+ },
402
+ {
403
+ "content": "DMEM",
404
+ "lstrip": false,
405
+ "normalized": false,
406
+ "rstrip": false,
407
+ "single_word": false
408
+ },
409
+ {
410
+ "content": "DPA",
411
+ "lstrip": false,
412
+ "normalized": false,
413
+ "rstrip": false,
414
+ "single_word": false
415
+ },
416
+ {
417
+ "content": "DSC",
418
+ "lstrip": false,
419
+ "normalized": false,
420
+ "rstrip": false,
421
+ "single_word": false
422
+ },
423
+ {
424
+ "content": "DT",
425
+ "lstrip": false,
426
+ "normalized": false,
427
+ "rstrip": false,
428
+ "single_word": false
429
+ },
430
+ {
431
+ "content": "DU",
432
+ "lstrip": false,
433
+ "normalized": false,
434
+ "rstrip": false,
435
+ "single_word": false
436
+ },
437
+ {
438
+ "content": "DVMU",
439
+ "lstrip": false,
440
+ "normalized": false,
441
+ "rstrip": false,
442
+ "single_word": false
443
+ },
444
+ {
445
+ "content": "EC",
446
+ "lstrip": false,
447
+ "normalized": false,
448
+ "rstrip": false,
449
+ "single_word": false
450
+ },
451
+ {
452
+ "content": "ECB",
453
+ "lstrip": false,
454
+ "normalized": false,
455
+ "rstrip": false,
456
+ "single_word": false
457
+ },
458
+ {
459
+ "content": "ECC",
460
+ "lstrip": false,
461
+ "normalized": false,
462
+ "rstrip": false,
463
+ "single_word": false
464
+ },
465
+ {
466
+ "content": "ECDHE",
467
+ "lstrip": false,
468
+ "normalized": false,
469
+ "rstrip": false,
470
+ "single_word": false
471
+ },
472
+ {
473
+ "content": "ECDSA",
474
+ "lstrip": false,
475
+ "normalized": false,
476
+ "rstrip": false,
477
+ "single_word": false
478
+ },
479
+ {
480
+ "content": "ECID",
481
+ "lstrip": false,
482
+ "normalized": false,
483
+ "rstrip": false,
484
+ "single_word": false
485
+ },
486
+ {
487
+ "content": "EDR",
488
+ "lstrip": false,
489
+ "normalized": false,
490
+ "rstrip": false,
491
+ "single_word": false
492
+ },
493
+ {
494
+ "content": "EOF",
495
+ "lstrip": false,
496
+ "normalized": false,
497
+ "rstrip": false,
498
+ "single_word": false
499
+ },
500
+ {
501
+ "content": "EOTTI",
502
+ "lstrip": false,
503
+ "normalized": false,
504
+ "rstrip": false,
505
+ "single_word": false
506
+ },
507
+ {
508
+ "content": "EQoS",
509
+ "lstrip": false,
510
+ "normalized": false,
511
+ "rstrip": false,
512
+ "single_word": false
513
+ },
514
+ {
515
+ "content": "FCL",
516
+ "lstrip": false,
517
+ "normalized": false,
518
+ "rstrip": false,
519
+ "single_word": false
520
+ },
521
+ {
522
+ "content": "FHTI",
523
+ "lstrip": false,
524
+ "normalized": false,
525
+ "rstrip": false,
526
+ "single_word": false
527
+ },
528
+ {
529
+ "content": "FIPS",
530
+ "lstrip": false,
531
+ "normalized": false,
532
+ "rstrip": false,
533
+ "single_word": false
534
+ },
535
+ {
536
+ "content": "FMEA",
537
+ "lstrip": false,
538
+ "normalized": false,
539
+ "rstrip": false,
540
+ "single_word": false
541
+ },
542
+ {
543
+ "content": "FMON",
544
+ "lstrip": false,
545
+ "normalized": false,
546
+ "rstrip": false,
547
+ "single_word": false
548
+ },
549
+ {
550
+ "content": "FO",
551
+ "lstrip": false,
552
+ "normalized": false,
553
+ "rstrip": false,
554
+ "single_word": false
555
+ },
556
+ {
557
+ "content": "FP",
558
+ "lstrip": false,
559
+ "normalized": false,
560
+ "rstrip": false,
561
+ "single_word": false
562
+ },
563
+ {
564
+ "content": "FPS",
565
+ "lstrip": false,
566
+ "normalized": false,
567
+ "rstrip": false,
568
+ "single_word": false
569
+ },
570
+ {
571
+ "content": "FW",
572
+ "lstrip": false,
573
+ "normalized": false,
574
+ "rstrip": false,
575
+ "single_word": false
576
+ },
577
+ {
578
+ "content": "FuSa",
579
+ "lstrip": false,
580
+ "normalized": false,
581
+ "rstrip": false,
582
+ "single_word": false
583
+ },
584
+ {
585
+ "content": "GCM",
586
+ "lstrip": false,
587
+ "normalized": false,
588
+ "rstrip": false,
589
+ "single_word": false
590
+ },
591
+ {
592
+ "content": "GFD",
593
+ "lstrip": false,
594
+ "normalized": false,
595
+ "rstrip": false,
596
+ "single_word": false
597
+ },
598
+ {
599
+ "content": "GIC",
600
+ "lstrip": false,
601
+ "normalized": false,
602
+ "rstrip": false,
603
+ "single_word": false
604
+ },
605
+ {
606
+ "content": "GMAC",
607
+ "lstrip": false,
608
+ "normalized": false,
609
+ "rstrip": false,
610
+ "single_word": false
611
+ },
612
+ {
613
+ "content": "GMSL",
614
+ "lstrip": false,
615
+ "normalized": false,
616
+ "rstrip": false,
617
+ "single_word": false
618
+ },
619
+ {
620
+ "content": "GOP",
621
+ "lstrip": false,
622
+ "normalized": false,
623
+ "rstrip": false,
624
+ "single_word": false
625
+ },
626
+ {
627
+ "content": "GP",
628
+ "lstrip": false,
629
+ "normalized": false,
630
+ "rstrip": false,
631
+ "single_word": false
632
+ },
633
+ {
634
+ "content": "GPCDMA",
635
+ "lstrip": false,
636
+ "normalized": false,
637
+ "rstrip": false,
638
+ "single_word": false
639
+ },
640
+ {
641
+ "content": "GPU",
642
+ "lstrip": false,
643
+ "normalized": false,
644
+ "rstrip": false,
645
+ "single_word": false
646
+ },
647
+ {
648
+ "content": "GR",
649
+ "lstrip": false,
650
+ "normalized": false,
651
+ "rstrip": false,
652
+ "single_word": false
653
+ },
654
+ {
655
+ "content": "Gpps",
656
+ "lstrip": false,
657
+ "normalized": false,
658
+ "rstrip": false,
659
+ "single_word": false
660
+ },
661
+ {
662
+ "content": "HBR",
663
+ "lstrip": false,
664
+ "normalized": false,
665
+ "rstrip": false,
666
+ "single_word": false
667
+ },
668
+ {
669
+ "content": "HBR2",
670
+ "lstrip": false,
671
+ "normalized": false,
672
+ "rstrip": false,
673
+ "single_word": false
674
+ },
675
+ {
676
+ "content": "HBR3",
677
+ "lstrip": false,
678
+ "normalized": false,
679
+ "rstrip": false,
680
+ "single_word": false
681
+ },
682
+ {
683
+ "content": "HDS",
684
+ "lstrip": false,
685
+ "normalized": false,
686
+ "rstrip": false,
687
+ "single_word": false
688
+ },
689
+ {
690
+ "content": "HIS",
691
+ "lstrip": false,
692
+ "normalized": false,
693
+ "rstrip": false,
694
+ "single_word": false
695
+ },
696
+ {
697
+ "content": "HMAC",
698
+ "lstrip": false,
699
+ "normalized": false,
700
+ "rstrip": false,
701
+ "single_word": false
702
+ },
703
+ {
704
+ "content": "HPSE",
705
+ "lstrip": false,
706
+ "normalized": false,
707
+ "rstrip": false,
708
+ "single_word": false
709
+ },
710
+ {
711
+ "content": "HSI",
712
+ "lstrip": false,
713
+ "normalized": false,
714
+ "rstrip": false,
715
+ "single_word": false
716
+ },
717
+ {
718
+ "content": "HSM",
719
+ "lstrip": false,
720
+ "normalized": false,
721
+ "rstrip": false,
722
+ "single_word": false
723
+ },
724
+ {
725
+ "content": "HSP",
726
+ "lstrip": false,
727
+ "normalized": false,
728
+ "rstrip": false,
729
+ "single_word": false
730
+ },
731
+ {
732
+ "content": "HW",
733
+ "lstrip": false,
734
+ "normalized": false,
735
+ "rstrip": false,
736
+ "single_word": false
737
+ },
738
+ {
739
+ "content": "IAS",
740
+ "lstrip": false,
741
+ "normalized": false,
742
+ "rstrip": false,
743
+ "single_word": false
744
+ },
745
+ {
746
+ "content": "IC",
747
+ "lstrip": false,
748
+ "normalized": false,
749
+ "rstrip": false,
750
+ "single_word": false
751
+ },
752
+ {
753
+ "content": "ICD",
754
+ "lstrip": false,
755
+ "normalized": false,
756
+ "rstrip": false,
757
+ "single_word": false
758
+ },
759
+ {
760
+ "content": "IDR",
761
+ "lstrip": false,
762
+ "normalized": false,
763
+ "rstrip": false,
764
+ "single_word": false
765
+ },
766
+ {
767
+ "content": "IDT",
768
+ "lstrip": false,
769
+ "normalized": false,
770
+ "rstrip": false,
771
+ "single_word": false
772
+ },
773
+ {
774
+ "content": "IEP",
775
+ "lstrip": false,
776
+ "normalized": false,
777
+ "rstrip": false,
778
+ "single_word": false
779
+ },
780
+ {
781
+ "content": "IEU",
782
+ "lstrip": false,
783
+ "normalized": false,
784
+ "rstrip": false,
785
+ "single_word": false
786
+ },
787
+ {
788
+ "content": "IFU",
789
+ "lstrip": false,
790
+ "normalized": false,
791
+ "rstrip": false,
792
+ "single_word": false
793
+ },
794
+ {
795
+ "content": "IID",
796
+ "lstrip": false,
797
+ "normalized": false,
798
+ "rstrip": false,
799
+ "single_word": false
800
+ },
801
+ {
802
+ "content": "ILD",
803
+ "lstrip": false,
804
+ "normalized": false,
805
+ "rstrip": false,
806
+ "single_word": false
807
+ },
808
+ {
809
+ "content": "IMEM",
810
+ "lstrip": false,
811
+ "normalized": false,
812
+ "rstrip": false,
813
+ "single_word": false
814
+ },
815
+ {
816
+ "content": "IOC",
817
+ "lstrip": false,
818
+ "normalized": false,
819
+ "rstrip": false,
820
+ "single_word": false
821
+ },
822
+ {
823
+ "content": "IOFA",
824
+ "lstrip": false,
825
+ "normalized": false,
826
+ "rstrip": false,
827
+ "single_word": false
828
+ },
829
+ {
830
+ "content": "IOMMU",
831
+ "lstrip": false,
832
+ "normalized": false,
833
+ "rstrip": false,
834
+ "single_word": false
835
+ },
836
+ {
837
+ "content": "IPC",
838
+ "lstrip": false,
839
+ "normalized": false,
840
+ "rstrip": false,
841
+ "single_word": false
842
+ },
843
+ {
844
+ "content": "IPI",
845
+ "lstrip": false,
846
+ "normalized": false,
847
+ "rstrip": false,
848
+ "single_word": false
849
+ },
850
+ {
851
+ "content": "IRF",
852
+ "lstrip": false,
853
+ "normalized": false,
854
+ "rstrip": false,
855
+ "single_word": false
856
+ },
857
+ {
858
+ "content": "IST",
859
+ "lstrip": false,
860
+ "normalized": false,
861
+ "rstrip": false,
862
+ "single_word": false
863
+ },
864
+ {
865
+ "content": "IV",
866
+ "lstrip": false,
867
+ "normalized": false,
868
+ "rstrip": false,
869
+ "single_word": false
870
+ },
871
+ {
872
+ "content": "IoT",
873
+ "lstrip": false,
874
+ "normalized": false,
875
+ "rstrip": false,
876
+ "single_word": false
877
+ },
878
+ {
879
+ "content": "JSR",
880
+ "lstrip": false,
881
+ "normalized": false,
882
+ "rstrip": false,
883
+ "single_word": false
884
+ },
885
+ {
886
+ "content": "KAT",
887
+ "lstrip": false,
888
+ "normalized": false,
889
+ "rstrip": false,
890
+ "single_word": false
891
+ },
892
+ {
893
+ "content": "KCV",
894
+ "lstrip": false,
895
+ "normalized": false,
896
+ "rstrip": false,
897
+ "single_word": false
898
+ },
899
+ {
900
+ "content": "KDF",
901
+ "lstrip": false,
902
+ "normalized": false,
903
+ "rstrip": false,
904
+ "single_word": false
905
+ },
906
+ {
907
+ "content": "KPI",
908
+ "lstrip": false,
909
+ "normalized": false,
910
+ "rstrip": false,
911
+ "single_word": false
912
+ },
913
+ {
914
+ "content": "L1PT",
915
+ "lstrip": false,
916
+ "normalized": false,
917
+ "rstrip": false,
918
+ "single_word": false
919
+ },
920
+ {
921
+ "content": "L2C",
922
+ "lstrip": false,
923
+ "normalized": false,
924
+ "rstrip": false,
925
+ "single_word": false
926
+ },
927
+ {
928
+ "content": "L2mDIR",
929
+ "lstrip": false,
930
+ "normalized": false,
931
+ "rstrip": false,
932
+ "single_word": false
933
+ },
934
+ {
935
+ "content": "L2vDIR",
936
+ "lstrip": false,
937
+ "normalized": false,
938
+ "rstrip": false,
939
+ "single_word": false
940
+ },
941
+ {
942
+ "content": "LAB",
943
+ "lstrip": false,
944
+ "normalized": false,
945
+ "rstrip": false,
946
+ "single_word": false
947
+ },
948
+ {
949
+ "content": "LBIST",
950
+ "lstrip": false,
951
+ "normalized": false,
952
+ "rstrip": false,
953
+ "single_word": false
954
+ },
955
+ {
956
+ "content": "LDC",
957
+ "lstrip": false,
958
+ "normalized": false,
959
+ "rstrip": false,
960
+ "single_word": false
961
+ },
962
+ {
963
+ "content": "LFT",
964
+ "lstrip": false,
965
+ "normalized": false,
966
+ "rstrip": false,
967
+ "single_word": false
968
+ },
969
+ {
970
+ "content": "LIC",
971
+ "lstrip": false,
972
+ "normalized": false,
973
+ "rstrip": false,
974
+ "single_word": false
975
+ },
976
+ {
977
+ "content": "LIP",
978
+ "lstrip": false,
979
+ "normalized": false,
980
+ "rstrip": false,
981
+ "single_word": false
982
+ },
983
+ {
984
+ "content": "LSB",
985
+ "lstrip": false,
986
+ "normalized": false,
987
+ "rstrip": false,
988
+ "single_word": false
989
+ },
990
+ {
991
+ "content": "MAC",
992
+ "lstrip": false,
993
+ "normalized": false,
994
+ "rstrip": false,
995
+ "single_word": false
996
+ },
997
+ {
998
+ "content": "MAQ",
999
+ "lstrip": false,
1000
+ "normalized": false,
1001
+ "rstrip": false,
1002
+ "single_word": false
1003
+ },
1004
+ {
1005
+ "content": "MB",
1006
+ "lstrip": false,
1007
+ "normalized": false,
1008
+ "rstrip": false,
1009
+ "single_word": false
1010
+ },
1011
+ {
1012
+ "content": "MBIST",
1013
+ "lstrip": false,
1014
+ "normalized": false,
1015
+ "rstrip": false,
1016
+ "single_word": false
1017
+ },
1018
+ {
1019
+ "content": "MCAL",
1020
+ "lstrip": false,
1021
+ "normalized": false,
1022
+ "rstrip": false,
1023
+ "single_word": false
1024
+ },
1025
+ {
1026
+ "content": "MCE",
1027
+ "lstrip": false,
1028
+ "normalized": false,
1029
+ "rstrip": false,
1030
+ "single_word": false
1031
+ },
1032
+ {
1033
+ "content": "MCU",
1034
+ "lstrip": false,
1035
+ "normalized": false,
1036
+ "rstrip": false,
1037
+ "single_word": false
1038
+ },
1039
+ {
1040
+ "content": "MSB",
1041
+ "lstrip": false,
1042
+ "normalized": false,
1043
+ "rstrip": false,
1044
+ "single_word": false
1045
+ },
1046
+ {
1047
+ "content": "MSS",
1048
+ "lstrip": false,
1049
+ "normalized": false,
1050
+ "rstrip": false,
1051
+ "single_word": false
1052
+ },
1053
+ {
1054
+ "content": "MST",
1055
+ "lstrip": false,
1056
+ "normalized": false,
1057
+ "rstrip": false,
1058
+ "single_word": false
1059
+ },
1060
+ {
1061
+ "content": "MTS",
1062
+ "lstrip": false,
1063
+ "normalized": false,
1064
+ "rstrip": false,
1065
+ "single_word": false
1066
+ },
1067
+ {
1068
+ "content": "MiTM",
1069
+ "lstrip": false,
1070
+ "normalized": false,
1071
+ "rstrip": false,
1072
+ "single_word": false
1073
+ },
1074
+ {
1075
+ "content": "NIP",
1076
+ "lstrip": false,
1077
+ "normalized": false,
1078
+ "rstrip": false,
1079
+ "single_word": false
1080
+ },
1081
+ {
1082
+ "content": "NIST",
1083
+ "lstrip": false,
1084
+ "normalized": false,
1085
+ "rstrip": false,
1086
+ "single_word": false
1087
+ },
1088
+ {
1089
+ "content": "NITO",
1090
+ "lstrip": false,
1091
+ "normalized": false,
1092
+ "rstrip": false,
1093
+ "single_word": false
1094
+ },
1095
+ {
1096
+ "content": "NOC",
1097
+ "lstrip": false,
1098
+ "normalized": false,
1099
+ "rstrip": false,
1100
+ "single_word": false
1101
+ },
1102
+ {
1103
+ "content": "NOOP",
1104
+ "lstrip": false,
1105
+ "normalized": false,
1106
+ "rstrip": false,
1107
+ "single_word": false
1108
+ },
1109
+ {
1110
+ "content": "NT",
1111
+ "lstrip": false,
1112
+ "normalized": false,
1113
+ "rstrip": false,
1114
+ "single_word": false
1115
+ },
1116
+ {
1117
+ "content": "NVDEC",
1118
+ "lstrip": false,
1119
+ "normalized": false,
1120
+ "rstrip": false,
1121
+ "single_word": false
1122
+ },
1123
+ {
1124
+ "content": "NVENC",
1125
+ "lstrip": false,
1126
+ "normalized": false,
1127
+ "rstrip": false,
1128
+ "single_word": false
1129
+ },
1130
+ {
1131
+ "content": "NVJPG",
1132
+ "lstrip": false,
1133
+ "normalized": false,
1134
+ "rstrip": false,
1135
+ "single_word": false
1136
+ },
1137
+ {
1138
+ "content": "NVM",
1139
+ "lstrip": false,
1140
+ "normalized": false,
1141
+ "rstrip": false,
1142
+ "single_word": false
1143
+ },
1144
+ {
1145
+ "content": "NVVSE",
1146
+ "lstrip": false,
1147
+ "normalized": false,
1148
+ "rstrip": false,
1149
+ "single_word": false
1150
+ },
1151
+ {
1152
+ "content": "OEM",
1153
+ "lstrip": false,
1154
+ "normalized": false,
1155
+ "rstrip": false,
1156
+ "single_word": false
1157
+ },
1158
+ {
1159
+ "content": "OFA",
1160
+ "lstrip": false,
1161
+ "normalized": false,
1162
+ "rstrip": false,
1163
+ "single_word": false
1164
+ },
1165
+ {
1166
+ "content": "OS",
1167
+ "lstrip": false,
1168
+ "normalized": false,
1169
+ "rstrip": false,
1170
+ "single_word": false
1171
+ },
1172
+ {
1173
+ "content": "OSP",
1174
+ "lstrip": false,
1175
+ "normalized": false,
1176
+ "rstrip": false,
1177
+ "single_word": false
1178
+ },
1179
+ {
1180
+ "content": "OTP",
1181
+ "lstrip": false,
1182
+ "normalized": false,
1183
+ "rstrip": false,
1184
+ "single_word": false
1185
+ },
1186
+ {
1187
+ "content": "PB",
1188
+ "lstrip": false,
1189
+ "normalized": false,
1190
+ "rstrip": false,
1191
+ "single_word": false
1192
+ },
1193
+ {
1194
+ "content": "PCIE",
1195
+ "lstrip": false,
1196
+ "normalized": false,
1197
+ "rstrip": false,
1198
+ "single_word": false
1199
+ },
1200
+ {
1201
+ "content": "PCPU",
1202
+ "lstrip": false,
1203
+ "normalized": false,
1204
+ "rstrip": false,
1205
+ "single_word": false
1206
+ },
1207
+ {
1208
+ "content": "PCR",
1209
+ "lstrip": false,
1210
+ "normalized": false,
1211
+ "rstrip": false,
1212
+ "single_word": false
1213
+ },
1214
+ {
1215
+ "content": "PCT",
1216
+ "lstrip": false,
1217
+ "normalized": false,
1218
+ "rstrip": false,
1219
+ "single_word": false
1220
+ },
1221
+ {
1222
+ "content": "PDK",
1223
+ "lstrip": false,
1224
+ "normalized": false,
1225
+ "rstrip": false,
1226
+ "single_word": false
1227
+ },
1228
+ {
1229
+ "content": "PII",
1230
+ "lstrip": false,
1231
+ "normalized": false,
1232
+ "rstrip": false,
1233
+ "single_word": false
1234
+ },
1235
+ {
1236
+ "content": "PIP",
1237
+ "lstrip": false,
1238
+ "normalized": false,
1239
+ "rstrip": false,
1240
+ "single_word": false
1241
+ },
1242
+ {
1243
+ "content": "PKC",
1244
+ "lstrip": false,
1245
+ "normalized": false,
1246
+ "rstrip": false,
1247
+ "single_word": false
1248
+ },
1249
+ {
1250
+ "content": "PKCS",
1251
+ "lstrip": false,
1252
+ "normalized": false,
1253
+ "rstrip": false,
1254
+ "single_word": false
1255
+ },
1256
+ {
1257
+ "content": "PKI",
1258
+ "lstrip": false,
1259
+ "normalized": false,
1260
+ "rstrip": false,
1261
+ "single_word": false
1262
+ },
1263
+ {
1264
+ "content": "PL",
1265
+ "lstrip": false,
1266
+ "normalized": false,
1267
+ "rstrip": false,
1268
+ "single_word": false
1269
+ },
1270
+ {
1271
+ "content": "PLA",
1272
+ "lstrip": false,
1273
+ "normalized": false,
1274
+ "rstrip": false,
1275
+ "single_word": false
1276
+ },
1277
+ {
1278
+ "content": "POR",
1279
+ "lstrip": false,
1280
+ "normalized": false,
1281
+ "rstrip": false,
1282
+ "single_word": false
1283
+ },
1284
+ {
1285
+ "content": "PPC",
1286
+ "lstrip": false,
1287
+ "normalized": false,
1288
+ "rstrip": false,
1289
+ "single_word": false
1290
+ },
1291
+ {
1292
+ "content": "PSC",
1293
+ "lstrip": false,
1294
+ "normalized": false,
1295
+ "rstrip": false,
1296
+ "single_word": false
1297
+ },
1298
+ {
1299
+ "content": "PTXT",
1300
+ "lstrip": false,
1301
+ "normalized": false,
1302
+ "rstrip": false,
1303
+ "single_word": false
1304
+ },
1305
+ {
1306
+ "content": "PVA",
1307
+ "lstrip": false,
1308
+ "normalized": false,
1309
+ "rstrip": false,
1310
+ "single_word": false
1311
+ },
1312
+ {
1313
+ "content": "QNX",
1314
+ "lstrip": false,
1315
+ "normalized": false,
1316
+ "rstrip": false,
1317
+ "single_word": false
1318
+ },
1319
+ {
1320
+ "content": "QOS",
1321
+ "lstrip": false,
1322
+ "normalized": false,
1323
+ "rstrip": false,
1324
+ "single_word": false
1325
+ },
1326
+ {
1327
+ "content": "QSPI",
1328
+ "lstrip": false,
1329
+ "normalized": false,
1330
+ "rstrip": false,
1331
+ "single_word": false
1332
+ },
1333
+ {
1334
+ "content": "RBG",
1335
+ "lstrip": false,
1336
+ "normalized": false,
1337
+ "rstrip": false,
1338
+ "single_word": false
1339
+ },
1340
+ {
1341
+ "content": "RBR",
1342
+ "lstrip": false,
1343
+ "normalized": false,
1344
+ "rstrip": false,
1345
+ "single_word": false
1346
+ },
1347
+ {
1348
+ "content": "RC",
1349
+ "lstrip": false,
1350
+ "normalized": false,
1351
+ "rstrip": false,
1352
+ "single_word": false
1353
+ },
1354
+ {
1355
+ "content": "RDEV",
1356
+ "lstrip": false,
1357
+ "normalized": false,
1358
+ "rstrip": false,
1359
+ "single_word": false
1360
+ },
1361
+ {
1362
+ "content": "REE",
1363
+ "lstrip": false,
1364
+ "normalized": false,
1365
+ "rstrip": false,
1366
+ "single_word": false
1367
+ },
1368
+ {
1369
+ "content": "RMA",
1370
+ "lstrip": false,
1371
+ "normalized": false,
1372
+ "rstrip": false,
1373
+ "single_word": false
1374
+ },
1375
+ {
1376
+ "content": "RMW",
1377
+ "lstrip": false,
1378
+ "normalized": false,
1379
+ "rstrip": false,
1380
+ "single_word": false
1381
+ },
1382
+ {
1383
+ "content": "RSA",
1384
+ "lstrip": false,
1385
+ "normalized": false,
1386
+ "rstrip": false,
1387
+ "single_word": false
1388
+ },
1389
+ {
1390
+ "content": "RSB",
1391
+ "lstrip": false,
1392
+ "normalized": false,
1393
+ "rstrip": false,
1394
+ "single_word": false
1395
+ },
1396
+ {
1397
+ "content": "RTS",
1398
+ "lstrip": false,
1399
+ "normalized": false,
1400
+ "rstrip": false,
1401
+ "single_word": false
1402
+ },
1403
+ {
1404
+ "content": "RoT",
1405
+ "lstrip": false,
1406
+ "normalized": false,
1407
+ "rstrip": false,
1408
+ "single_word": false
1409
+ },
1410
+ {
1411
+ "content": "SAE",
1412
+ "lstrip": false,
1413
+ "normalized": false,
1414
+ "rstrip": false,
1415
+ "single_word": false
1416
+ },
1417
+ {
1418
+ "content": "SBK",
1419
+ "lstrip": false,
1420
+ "normalized": false,
1421
+ "rstrip": false,
1422
+ "single_word": false
1423
+ },
1424
+ {
1425
+ "content": "SCH",
1426
+ "lstrip": false,
1427
+ "normalized": false,
1428
+ "rstrip": false,
1429
+ "single_word": false
1430
+ },
1431
+ {
1432
+ "content": "SDK",
1433
+ "lstrip": false,
1434
+ "normalized": false,
1435
+ "rstrip": false,
1436
+ "single_word": false
1437
+ },
1438
+ {
1439
+ "content": "SE",
1440
+ "lstrip": false,
1441
+ "normalized": false,
1442
+ "rstrip": false,
1443
+ "single_word": false
1444
+ },
1445
+ {
1446
+ "content": "SEL0",
1447
+ "lstrip": false,
1448
+ "normalized": false,
1449
+ "rstrip": false,
1450
+ "single_word": false
1451
+ },
1452
+ {
1453
+ "content": "SEL1",
1454
+ "lstrip": false,
1455
+ "normalized": false,
1456
+ "rstrip": false,
1457
+ "single_word": false
1458
+ },
1459
+ {
1460
+ "content": "SEooC",
1461
+ "lstrip": false,
1462
+ "normalized": false,
1463
+ "rstrip": false,
1464
+ "single_word": false
1465
+ },
1466
+ {
1467
+ "content": "SGM",
1468
+ "lstrip": false,
1469
+ "normalized": false,
1470
+ "rstrip": false,
1471
+ "single_word": false
1472
+ },
1473
+ {
1474
+ "content": "SHA",
1475
+ "lstrip": false,
1476
+ "normalized": false,
1477
+ "rstrip": false,
1478
+ "single_word": false
1479
+ },
1480
+ {
1481
+ "content": "SHA256",
1482
+ "lstrip": false,
1483
+ "normalized": false,
1484
+ "rstrip": false,
1485
+ "single_word": false
1486
+ },
1487
+ {
1488
+ "content": "SHA512",
1489
+ "lstrip": false,
1490
+ "normalized": false,
1491
+ "rstrip": false,
1492
+ "single_word": false
1493
+ },
1494
+ {
1495
+ "content": "SHE",
1496
+ "lstrip": false,
1497
+ "normalized": false,
1498
+ "rstrip": false,
1499
+ "single_word": false
1500
+ },
1501
+ {
1502
+ "content": "SKU",
1503
+ "lstrip": false,
1504
+ "normalized": false,
1505
+ "rstrip": false,
1506
+ "single_word": false
1507
+ },
1508
+ {
1509
+ "content": "SNOC",
1510
+ "lstrip": false,
1511
+ "normalized": false,
1512
+ "rstrip": false,
1513
+ "single_word": false
1514
+ },
1515
+ {
1516
+ "content": "SO",
1517
+ "lstrip": false,
1518
+ "normalized": false,
1519
+ "rstrip": false,
1520
+ "single_word": false
1521
+ },
1522
+ {
1523
+ "content": "SPA",
1524
+ "lstrip": false,
1525
+ "normalized": false,
1526
+ "rstrip": false,
1527
+ "single_word": false
1528
+ },
1529
+ {
1530
+ "content": "SQ",
1531
+ "lstrip": false,
1532
+ "normalized": false,
1533
+ "rstrip": false,
1534
+ "single_word": false
1535
+ },
1536
+ {
1537
+ "content": "SSR",
1538
+ "lstrip": false,
1539
+ "normalized": false,
1540
+ "rstrip": false,
1541
+ "single_word": false
1542
+ },
1543
+ {
1544
+ "content": "SST",
1545
+ "lstrip": false,
1546
+ "normalized": false,
1547
+ "rstrip": false,
1548
+ "single_word": false
1549
+ },
1550
+ {
1551
+ "content": "SW",
1552
+ "lstrip": false,
1553
+ "normalized": false,
1554
+ "rstrip": false,
1555
+ "single_word": false
1556
+ },
1557
+ {
1558
+ "content": "SWAT",
1559
+ "lstrip": false,
1560
+ "normalized": false,
1561
+ "rstrip": false,
1562
+ "single_word": false
1563
+ },
1564
+ {
1565
+ "content": "SoC",
1566
+ "lstrip": false,
1567
+ "normalized": false,
1568
+ "rstrip": false,
1569
+ "single_word": false
1570
+ },
1571
+ {
1572
+ "content": "TA",
1573
+ "lstrip": false,
1574
+ "normalized": false,
1575
+ "rstrip": false,
1576
+ "single_word": false
1577
+ },
1578
+ {
1579
+ "content": "TCF",
1580
+ "lstrip": false,
1581
+ "normalized": false,
1582
+ "rstrip": false,
1583
+ "single_word": false
1584
+ },
1585
+ {
1586
+ "content": "TEE",
1587
+ "lstrip": false,
1588
+ "normalized": false,
1589
+ "rstrip": false,
1590
+ "single_word": false
1591
+ },
1592
+ {
1593
+ "content": "THI",
1594
+ "lstrip": false,
1595
+ "normalized": false,
1596
+ "rstrip": false,
1597
+ "single_word": false
1598
+ },
1599
+ {
1600
+ "content": "TNR",
1601
+ "lstrip": false,
1602
+ "normalized": false,
1603
+ "rstrip": false,
1604
+ "single_word": false
1605
+ },
1606
+ {
1607
+ "content": "TOS",
1608
+ "lstrip": false,
1609
+ "normalized": false,
1610
+ "rstrip": false,
1611
+ "single_word": false
1612
+ },
1613
+ {
1614
+ "content": "TRC",
1615
+ "lstrip": false,
1616
+ "normalized": false,
1617
+ "rstrip": false,
1618
+ "single_word": false
1619
+ },
1620
+ {
1621
+ "content": "TRL",
1622
+ "lstrip": false,
1623
+ "normalized": false,
1624
+ "rstrip": false,
1625
+ "single_word": false
1626
+ },
1627
+ {
1628
+ "content": "TSEC",
1629
+ "lstrip": false,
1630
+ "normalized": false,
1631
+ "rstrip": false,
1632
+ "single_word": false
1633
+ },
1634
+ {
1635
+ "content": "TZ",
1636
+ "lstrip": false,
1637
+ "normalized": false,
1638
+ "rstrip": false,
1639
+ "single_word": false
1640
+ },
1641
+ {
1642
+ "content": "UFS",
1643
+ "lstrip": false,
1644
+ "normalized": false,
1645
+ "rstrip": false,
1646
+ "single_word": false
1647
+ },
1648
+ {
1649
+ "content": "VBR",
1650
+ "lstrip": false,
1651
+ "normalized": false,
1652
+ "rstrip": false,
1653
+ "single_word": false
1654
+ },
1655
+ {
1656
+ "content": "VCPU",
1657
+ "lstrip": false,
1658
+ "normalized": false,
1659
+ "rstrip": false,
1660
+ "single_word": false
1661
+ },
1662
+ {
1663
+ "content": "VI",
1664
+ "lstrip": false,
1665
+ "normalized": false,
1666
+ "rstrip": false,
1667
+ "single_word": false
1668
+ },
1669
+ {
1670
+ "content": "VIC",
1671
+ "lstrip": false,
1672
+ "normalized": false,
1673
+ "rstrip": false,
1674
+ "single_word": false
1675
+ },
1676
+ {
1677
+ "content": "VMEM",
1678
+ "lstrip": false,
1679
+ "normalized": false,
1680
+ "rstrip": false,
1681
+ "single_word": false
1682
+ },
1683
+ {
1684
+ "content": "VMID",
1685
+ "lstrip": false,
1686
+ "normalized": false,
1687
+ "rstrip": false,
1688
+ "single_word": false
1689
+ },
1690
+ {
1691
+ "content": "VPU",
1692
+ "lstrip": false,
1693
+ "normalized": false,
1694
+ "rstrip": false,
1695
+ "single_word": false
1696
+ },
1697
+ {
1698
+ "content": "VRC",
1699
+ "lstrip": false,
1700
+ "normalized": false,
1701
+ "rstrip": false,
1702
+ "single_word": false
1703
+ },
1704
+ {
1705
+ "content": "VUI",
1706
+ "lstrip": false,
1707
+ "normalized": false,
1708
+ "rstrip": false,
1709
+ "single_word": false
1710
+ },
1711
+ {
1712
+ "content": "WARB",
1713
+ "lstrip": false,
1714
+ "normalized": false,
1715
+ "rstrip": false,
1716
+ "single_word": false
1717
+ },
1718
+ {
1719
+ "content": "XIP",
1720
+ "lstrip": false,
1721
+ "normalized": false,
1722
+ "rstrip": false,
1723
+ "single_word": false
1724
+ },
1725
+ {
1726
+ "content": "bpp",
1727
+ "lstrip": false,
1728
+ "normalized": false,
1729
+ "rstrip": false,
1730
+ "single_word": false
1731
+ },
1732
+ {
1733
+ "content": "eMMC",
1734
+ "lstrip": false,
1735
+ "normalized": false,
1736
+ "rstrip": false,
1737
+ "single_word": false
1738
+ },
1739
+ {
1740
+ "content": "hfPLA",
1741
+ "lstrip": false,
1742
+ "normalized": false,
1743
+ "rstrip": false,
1744
+ "single_word": false
1745
+ },
1746
+ {
1747
+ "content": "iGPU",
1748
+ "lstrip": false,
1749
+ "normalized": false,
1750
+ "rstrip": false,
1751
+ "single_word": false
1752
+ },
1753
+ {
1754
+ "content": "ipc",
1755
+ "lstrip": false,
1756
+ "normalized": false,
1757
+ "rstrip": false,
1758
+ "single_word": false
1759
+ },
1760
+ {
1761
+ "content": "ipc_fg",
1762
+ "lstrip": false,
1763
+ "normalized": false,
1764
+ "rstrip": false,
1765
+ "single_word": false
1766
+ },
1767
+ {
1768
+ "content": "ipc_t",
1769
+ "lstrip": false,
1770
+ "normalized": false,
1771
+ "rstrip": false,
1772
+ "single_word": false
1773
+ },
1774
+ {
1775
+ "content": "sbPLA",
1776
+ "lstrip": false,
1777
+ "normalized": false,
1778
+ "rstrip": false,
1779
+ "single_word": false
1780
+ },
1781
+ {
1782
+ "content": "xBTV",
1783
+ "lstrip": false,
1784
+ "normalized": false,
1785
+ "rstrip": false,
1786
+ "single_word": false
1787
+ },
1788
+ {
1789
+ "content": "xps",
1790
+ "lstrip": false,
1791
+ "normalized": false,
1792
+ "rstrip": false,
1793
+ "single_word": false
1794
+ }
1795
+ ],
1796
+ "bos_token": {
1797
+ "content": "<|startoftext|>",
1798
+ "lstrip": false,
1799
+ "normalized": false,
1800
+ "rstrip": false,
1801
+ "single_word": false
1802
+ },
1803
+ "eos_token": {
1804
+ "content": "<|return|>",
1805
+ "lstrip": false,
1806
+ "normalized": false,
1807
+ "rstrip": false,
1808
+ "single_word": false
1809
+ },
1810
+ "pad_token": {
1811
+ "content": "<|endoftext|>",
1812
+ "lstrip": false,
1813
+ "normalized": false,
1814
+ "rstrip": false,
1815
+ "single_word": false
1816
+ }
1817
+ }
checkpoint-3284/tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ec3af79eb37b392bb5382bfe3f4eeab633498c220a804f4fd5d7d102a000f1a
3
+ size 27914312
checkpoint-3284/tokenizer_config.json ADDED
@@ -0,0 +1,2489 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "1529": {
4
+ "content": "SE",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "2022": {
12
+ "content": "IC",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2416": {
20
+ "content": "AD",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3360": {
28
+ "content": "OS",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "4478": {
36
+ "content": "IV",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "5173": {
44
+ "content": "PL",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "6258": {
52
+ "content": "IST",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "6781": {
60
+ "content": "CA",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "7726": {
68
+ "content": "FO",
69
+ "lstrip": false,
70
+ "normalized": false,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": true
74
+ },
75
+ "9375": {
76
+ "content": "REE",
77
+ "lstrip": false,
78
+ "normalized": false,
79
+ "rstrip": false,
80
+ "single_word": false,
81
+ "special": true
82
+ },
83
+ "9760": {
84
+ "content": "EC",
85
+ "lstrip": false,
86
+ "normalized": false,
87
+ "rstrip": false,
88
+ "single_word": false,
89
+ "special": true
90
+ },
91
+ "10227": {
92
+ "content": "TA",
93
+ "lstrip": false,
94
+ "normalized": false,
95
+ "rstrip": false,
96
+ "single_word": false,
97
+ "special": true
98
+ },
99
+ "11720": {
100
+ "content": "LIC",
101
+ "lstrip": false,
102
+ "normalized": false,
103
+ "rstrip": false,
104
+ "single_word": false,
105
+ "special": true
106
+ },
107
+ "12235": {
108
+ "content": "NT",
109
+ "lstrip": false,
110
+ "normalized": false,
111
+ "rstrip": false,
112
+ "single_word": false,
113
+ "special": true
114
+ },
115
+ "12515": {
116
+ "content": "RC",
117
+ "lstrip": false,
118
+ "normalized": false,
119
+ "rstrip": false,
120
+ "single_word": false,
121
+ "special": true
122
+ },
123
+ "13874": {
124
+ "content": "MB",
125
+ "lstrip": false,
126
+ "normalized": false,
127
+ "rstrip": false,
128
+ "single_word": false,
129
+ "special": true
130
+ },
131
+ "13905": {
132
+ "content": "GR",
133
+ "lstrip": false,
134
+ "normalized": false,
135
+ "rstrip": false,
136
+ "single_word": false,
137
+ "special": true
138
+ },
139
+ "15409": {
140
+ "content": "DU",
141
+ "lstrip": false,
142
+ "normalized": false,
143
+ "rstrip": false,
144
+ "single_word": false,
145
+ "special": true
146
+ },
147
+ "17183": {
148
+ "content": "DT",
149
+ "lstrip": false,
150
+ "normalized": false,
151
+ "rstrip": false,
152
+ "single_word": false,
153
+ "special": true
154
+ },
155
+ "19862": {
156
+ "content": "SO",
157
+ "lstrip": false,
158
+ "normalized": false,
159
+ "rstrip": false,
160
+ "single_word": false,
161
+ "special": true
162
+ },
163
+ "20174": {
164
+ "content": "FP",
165
+ "lstrip": false,
166
+ "normalized": false,
167
+ "rstrip": false,
168
+ "single_word": false,
169
+ "special": true
170
+ },
171
+ "22723": {
172
+ "content": "VI",
173
+ "lstrip": false,
174
+ "normalized": false,
175
+ "rstrip": false,
176
+ "single_word": false,
177
+ "special": true
178
+ },
179
+ "27968": {
180
+ "content": "SW",
181
+ "lstrip": false,
182
+ "normalized": false,
183
+ "rstrip": false,
184
+ "single_word": false,
185
+ "special": true
186
+ },
187
+ "29829": {
188
+ "content": "CV",
189
+ "lstrip": false,
190
+ "normalized": false,
191
+ "rstrip": false,
192
+ "single_word": false,
193
+ "special": true
194
+ },
195
+ "29864": {
196
+ "content": "GP",
197
+ "lstrip": false,
198
+ "normalized": false,
199
+ "rstrip": false,
200
+ "single_word": false,
201
+ "special": true
202
+ },
203
+ "34134": {
204
+ "content": "ILD",
205
+ "lstrip": false,
206
+ "normalized": false,
207
+ "rstrip": false,
208
+ "single_word": false,
209
+ "special": true
210
+ },
211
+ "34435": {
212
+ "content": "FW",
213
+ "lstrip": false,
214
+ "normalized": false,
215
+ "rstrip": false,
216
+ "single_word": false,
217
+ "special": true
218
+ },
219
+ "39749": {
220
+ "content": "TRL",
221
+ "lstrip": false,
222
+ "normalized": false,
223
+ "rstrip": false,
224
+ "single_word": false,
225
+ "special": true
226
+ },
227
+ "43230": {
228
+ "content": "LAB",
229
+ "lstrip": false,
230
+ "normalized": false,
231
+ "rstrip": false,
232
+ "single_word": false,
233
+ "special": true
234
+ },
235
+ "46966": {
236
+ "content": "SDK",
237
+ "lstrip": false,
238
+ "normalized": false,
239
+ "rstrip": false,
240
+ "single_word": false,
241
+ "special": true
242
+ },
243
+ "47787": {
244
+ "content": "CPU",
245
+ "lstrip": false,
246
+ "normalized": false,
247
+ "rstrip": false,
248
+ "single_word": false,
249
+ "special": true
250
+ },
251
+ "47994": {
252
+ "content": "MAC",
253
+ "lstrip": false,
254
+ "normalized": false,
255
+ "rstrip": false,
256
+ "single_word": false,
257
+ "special": true
258
+ },
259
+ "50719": {
260
+ "content": "IAS",
261
+ "lstrip": false,
262
+ "normalized": false,
263
+ "rstrip": false,
264
+ "single_word": false,
265
+ "special": true
266
+ },
267
+ "52907": {
268
+ "content": "CAR",
269
+ "lstrip": false,
270
+ "normalized": false,
271
+ "rstrip": false,
272
+ "single_word": false,
273
+ "special": true
274
+ },
275
+ "54793": {
276
+ "content": "EOF",
277
+ "lstrip": false,
278
+ "normalized": false,
279
+ "rstrip": false,
280
+ "single_word": false,
281
+ "special": true
282
+ },
283
+ "58530": {
284
+ "content": "PB",
285
+ "lstrip": false,
286
+ "normalized": false,
287
+ "rstrip": false,
288
+ "single_word": false,
289
+ "special": true
290
+ },
291
+ "66773": {
292
+ "content": "DEV",
293
+ "lstrip": false,
294
+ "normalized": false,
295
+ "rstrip": false,
296
+ "single_word": false,
297
+ "special": true
298
+ },
299
+ "68495": {
300
+ "content": "HW",
301
+ "lstrip": false,
302
+ "normalized": false,
303
+ "rstrip": false,
304
+ "single_word": false,
305
+ "special": true
306
+ },
307
+ "70684": {
308
+ "content": "SHA",
309
+ "lstrip": false,
310
+ "normalized": false,
311
+ "rstrip": false,
312
+ "single_word": false,
313
+ "special": true
314
+ },
315
+ "72089": {
316
+ "content": "SKU",
317
+ "lstrip": false,
318
+ "normalized": false,
319
+ "rstrip": false,
320
+ "single_word": false,
321
+ "special": true
322
+ },
323
+ "74923": {
324
+ "content": "CAN",
325
+ "lstrip": false,
326
+ "normalized": false,
327
+ "rstrip": false,
328
+ "single_word": false,
329
+ "special": true
330
+ },
331
+ "77411": {
332
+ "content": "AKE",
333
+ "lstrip": false,
334
+ "normalized": false,
335
+ "rstrip": false,
336
+ "single_word": false,
337
+ "special": true
338
+ },
339
+ "81990": {
340
+ "content": "DEP",
341
+ "lstrip": false,
342
+ "normalized": false,
343
+ "rstrip": false,
344
+ "single_word": false,
345
+ "special": true
346
+ },
347
+ "82244": {
348
+ "content": "GPU",
349
+ "lstrip": false,
350
+ "normalized": false,
351
+ "rstrip": false,
352
+ "single_word": false,
353
+ "special": true
354
+ },
355
+ "84526": {
356
+ "content": "POR",
357
+ "lstrip": false,
358
+ "normalized": false,
359
+ "rstrip": false,
360
+ "single_word": false,
361
+ "special": true
362
+ },
363
+ "86154": {
364
+ "content": "IID",
365
+ "lstrip": false,
366
+ "normalized": false,
367
+ "rstrip": false,
368
+ "single_word": false,
369
+ "special": true
370
+ },
371
+ "86297": {
372
+ "content": "CSI",
373
+ "lstrip": false,
374
+ "normalized": false,
375
+ "rstrip": false,
376
+ "single_word": false,
377
+ "special": true
378
+ },
379
+ "93660": {
380
+ "content": "ACL",
381
+ "lstrip": false,
382
+ "normalized": false,
383
+ "rstrip": false,
384
+ "single_word": false,
385
+ "special": true
386
+ },
387
+ "94432": {
388
+ "content": "TZ",
389
+ "lstrip": false,
390
+ "normalized": false,
391
+ "rstrip": false,
392
+ "single_word": false,
393
+ "special": true
394
+ },
395
+ "95202": {
396
+ "content": "SQ",
397
+ "lstrip": false,
398
+ "normalized": false,
399
+ "rstrip": false,
400
+ "single_word": false,
401
+ "special": true
402
+ },
403
+ "100413": {
404
+ "content": "PSC",
405
+ "lstrip": false,
406
+ "normalized": false,
407
+ "rstrip": false,
408
+ "single_word": false,
409
+ "special": true
410
+ },
411
+ "104755": {
412
+ "content": "DMA",
413
+ "lstrip": false,
414
+ "normalized": false,
415
+ "rstrip": false,
416
+ "single_word": false,
417
+ "special": true
418
+ },
419
+ "104805": {
420
+ "content": "BW",
421
+ "lstrip": false,
422
+ "normalized": false,
423
+ "rstrip": false,
424
+ "single_word": false,
425
+ "special": true
426
+ },
427
+ "106979": {
428
+ "content": "OTP",
429
+ "lstrip": false,
430
+ "normalized": false,
431
+ "rstrip": false,
432
+ "single_word": false,
433
+ "special": true
434
+ },
435
+ "110871": {
436
+ "content": "CRC",
437
+ "lstrip": false,
438
+ "normalized": false,
439
+ "rstrip": false,
440
+ "single_word": false,
441
+ "special": true
442
+ },
443
+ "117565": {
444
+ "content": "FPS",
445
+ "lstrip": false,
446
+ "normalized": false,
447
+ "rstrip": false,
448
+ "single_word": false,
449
+ "special": true
450
+ },
451
+ "118754": {
452
+ "content": "IPC",
453
+ "lstrip": false,
454
+ "normalized": false,
455
+ "rstrip": false,
456
+ "single_word": false,
457
+ "special": true
458
+ },
459
+ "126731": {
460
+ "content": "OEM",
461
+ "lstrip": false,
462
+ "normalized": false,
463
+ "rstrip": false,
464
+ "single_word": false,
465
+ "special": true
466
+ },
467
+ "126978": {
468
+ "content": "AES",
469
+ "lstrip": false,
470
+ "normalized": false,
471
+ "rstrip": false,
472
+ "single_word": false,
473
+ "special": true
474
+ },
475
+ "130911": {
476
+ "content": "RSA",
477
+ "lstrip": false,
478
+ "normalized": false,
479
+ "rstrip": false,
480
+ "single_word": false,
481
+ "special": true
482
+ },
483
+ "147130": {
484
+ "content": "CTR",
485
+ "lstrip": false,
486
+ "normalized": false,
487
+ "rstrip": false,
488
+ "single_word": false,
489
+ "special": true
490
+ },
491
+ "151336": {
492
+ "content": "OSP",
493
+ "lstrip": false,
494
+ "normalized": false,
495
+ "rstrip": false,
496
+ "single_word": false,
497
+ "special": true
498
+ },
499
+ "152076": {
500
+ "content": "IOC",
501
+ "lstrip": false,
502
+ "normalized": false,
503
+ "rstrip": false,
504
+ "single_word": false,
505
+ "special": true
506
+ },
507
+ "152095": {
508
+ "content": "SPA",
509
+ "lstrip": false,
510
+ "normalized": false,
511
+ "rstrip": false,
512
+ "single_word": false,
513
+ "special": true
514
+ },
515
+ "152119": {
516
+ "content": "CDD",
517
+ "lstrip": false,
518
+ "normalized": false,
519
+ "rstrip": false,
520
+ "single_word": false,
521
+ "special": true
522
+ },
523
+ "155474": {
524
+ "content": "SCH",
525
+ "lstrip": false,
526
+ "normalized": false,
527
+ "rstrip": false,
528
+ "single_word": false,
529
+ "special": true
530
+ },
531
+ "158359": {
532
+ "content": "ipc",
533
+ "lstrip": false,
534
+ "normalized": false,
535
+ "rstrip": false,
536
+ "single_word": false,
537
+ "special": true
538
+ },
539
+ "162121": {
540
+ "content": "PLA",
541
+ "lstrip": false,
542
+ "normalized": false,
543
+ "rstrip": false,
544
+ "single_word": false,
545
+ "special": true
546
+ },
547
+ "166996": {
548
+ "content": "CBC",
549
+ "lstrip": false,
550
+ "normalized": false,
551
+ "rstrip": false,
552
+ "single_word": false,
553
+ "special": true
554
+ },
555
+ "171893": {
556
+ "content": "DISPLAY",
557
+ "lstrip": false,
558
+ "normalized": false,
559
+ "rstrip": false,
560
+ "single_word": false,
561
+ "special": true
562
+ },
563
+ "172873": {
564
+ "content": "AAD",
565
+ "lstrip": false,
566
+ "normalized": false,
567
+ "rstrip": false,
568
+ "single_word": false,
569
+ "special": true
570
+ },
571
+ "175772": {
572
+ "content": "TEE",
573
+ "lstrip": false,
574
+ "normalized": false,
575
+ "rstrip": false,
576
+ "single_word": false,
577
+ "special": true
578
+ },
579
+ "177970": {
580
+ "content": "ECB",
581
+ "lstrip": false,
582
+ "normalized": false,
583
+ "rstrip": false,
584
+ "single_word": false,
585
+ "special": true
586
+ },
587
+ "178261": {
588
+ "content": "ECC",
589
+ "lstrip": false,
590
+ "normalized": false,
591
+ "rstrip": false,
592
+ "single_word": false,
593
+ "special": true
594
+ },
595
+ "178974": {
596
+ "content": "PCR",
597
+ "lstrip": false,
598
+ "normalized": false,
599
+ "rstrip": false,
600
+ "single_word": false,
601
+ "special": true
602
+ },
603
+ "186075": {
604
+ "content": "IPI",
605
+ "lstrip": false,
606
+ "normalized": false,
607
+ "rstrip": false,
608
+ "single_word": false,
609
+ "special": true
610
+ },
611
+ "187697": {
612
+ "content": "SSR",
613
+ "lstrip": false,
614
+ "normalized": false,
615
+ "rstrip": false,
616
+ "single_word": false,
617
+ "special": true
618
+ },
619
+ "199998": {
620
+ "content": "<|startoftext|>",
621
+ "lstrip": false,
622
+ "normalized": false,
623
+ "rstrip": false,
624
+ "single_word": false,
625
+ "special": true
626
+ },
627
+ "199999": {
628
+ "content": "<|endoftext|>",
629
+ "lstrip": false,
630
+ "normalized": false,
631
+ "rstrip": false,
632
+ "single_word": false,
633
+ "special": true
634
+ },
635
+ "200000": {
636
+ "content": "<|reserved_200000|>",
637
+ "lstrip": false,
638
+ "normalized": false,
639
+ "rstrip": false,
640
+ "single_word": false,
641
+ "special": true
642
+ },
643
+ "200001": {
644
+ "content": "<|reserved_200001|>",
645
+ "lstrip": false,
646
+ "normalized": false,
647
+ "rstrip": false,
648
+ "single_word": false,
649
+ "special": true
650
+ },
651
+ "200002": {
652
+ "content": "<|return|>",
653
+ "lstrip": false,
654
+ "normalized": false,
655
+ "rstrip": false,
656
+ "single_word": false,
657
+ "special": true
658
+ },
659
+ "200003": {
660
+ "content": "<|constrain|>",
661
+ "lstrip": false,
662
+ "normalized": false,
663
+ "rstrip": false,
664
+ "single_word": false,
665
+ "special": true
666
+ },
667
+ "200004": {
668
+ "content": "<|reserved_200004|>",
669
+ "lstrip": false,
670
+ "normalized": false,
671
+ "rstrip": false,
672
+ "single_word": false,
673
+ "special": true
674
+ },
675
+ "200005": {
676
+ "content": "<|channel|>",
677
+ "lstrip": false,
678
+ "normalized": false,
679
+ "rstrip": false,
680
+ "single_word": false,
681
+ "special": true
682
+ },
683
+ "200006": {
684
+ "content": "<|start|>",
685
+ "lstrip": false,
686
+ "normalized": false,
687
+ "rstrip": false,
688
+ "single_word": false,
689
+ "special": true
690
+ },
691
+ "200007": {
692
+ "content": "<|end|>",
693
+ "lstrip": false,
694
+ "normalized": false,
695
+ "rstrip": false,
696
+ "single_word": false,
697
+ "special": true
698
+ },
699
+ "200008": {
700
+ "content": "<|message|>",
701
+ "lstrip": false,
702
+ "normalized": false,
703
+ "rstrip": false,
704
+ "single_word": false,
705
+ "special": true
706
+ },
707
+ "200009": {
708
+ "content": "<|reserved_200009|>",
709
+ "lstrip": false,
710
+ "normalized": false,
711
+ "rstrip": false,
712
+ "single_word": false,
713
+ "special": true
714
+ },
715
+ "200010": {
716
+ "content": "<|reserved_200010|>",
717
+ "lstrip": false,
718
+ "normalized": false,
719
+ "rstrip": false,
720
+ "single_word": false,
721
+ "special": true
722
+ },
723
+ "200011": {
724
+ "content": "<|reserved_200011|>",
725
+ "lstrip": false,
726
+ "normalized": false,
727
+ "rstrip": false,
728
+ "single_word": false,
729
+ "special": true
730
+ },
731
+ "200012": {
732
+ "content": "<|call|>",
733
+ "lstrip": false,
734
+ "normalized": false,
735
+ "rstrip": false,
736
+ "single_word": false,
737
+ "special": true
738
+ },
739
+ "200013": {
740
+ "content": "<|reserved_200013|>",
741
+ "lstrip": false,
742
+ "normalized": false,
743
+ "rstrip": false,
744
+ "single_word": false,
745
+ "special": true
746
+ },
747
+ "200014": {
748
+ "content": "<|reserved_200014|>",
749
+ "lstrip": false,
750
+ "normalized": false,
751
+ "rstrip": false,
752
+ "single_word": false,
753
+ "special": true
754
+ },
755
+ "200015": {
756
+ "content": "<|reserved_200015|>",
757
+ "lstrip": false,
758
+ "normalized": false,
759
+ "rstrip": false,
760
+ "single_word": false,
761
+ "special": true
762
+ },
763
+ "200016": {
764
+ "content": "<|reserved_200016|>",
765
+ "lstrip": false,
766
+ "normalized": false,
767
+ "rstrip": false,
768
+ "single_word": false,
769
+ "special": true
770
+ },
771
+ "200017": {
772
+ "content": "<|reserved_200017|>",
773
+ "lstrip": false,
774
+ "normalized": false,
775
+ "rstrip": false,
776
+ "single_word": false,
777
+ "special": true
778
+ },
779
+ "200018": {
780
+ "content": "<|endofprompt|>",
781
+ "lstrip": false,
782
+ "normalized": false,
783
+ "rstrip": false,
784
+ "single_word": false,
785
+ "special": true
786
+ },
787
+ "200019": {
788
+ "content": "AArch64",
789
+ "lstrip": false,
790
+ "normalized": false,
791
+ "rstrip": false,
792
+ "single_word": false,
793
+ "special": true
794
+ },
795
+ "200020": {
796
+ "content": "AES256GCM",
797
+ "lstrip": false,
798
+ "normalized": false,
799
+ "rstrip": false,
800
+ "single_word": false,
801
+ "special": true
802
+ },
803
+ "200021": {
804
+ "content": "AESCBC",
805
+ "lstrip": false,
806
+ "normalized": false,
807
+ "rstrip": false,
808
+ "single_word": false,
809
+ "special": true
810
+ },
811
+ "200022": {
812
+ "content": "AON",
813
+ "lstrip": false,
814
+ "normalized": false,
815
+ "rstrip": false,
816
+ "single_word": false,
817
+ "special": true
818
+ },
819
+ "200023": {
820
+ "content": "ASID",
821
+ "lstrip": false,
822
+ "normalized": false,
823
+ "rstrip": false,
824
+ "single_word": false,
825
+ "special": true
826
+ },
827
+ "200024": {
828
+ "content": "AXI",
829
+ "lstrip": false,
830
+ "normalized": false,
831
+ "rstrip": false,
832
+ "single_word": false,
833
+ "special": true
834
+ },
835
+ "200025": {
836
+ "content": "Acronym",
837
+ "lstrip": false,
838
+ "normalized": false,
839
+ "rstrip": false,
840
+ "single_word": false,
841
+ "special": true
842
+ },
843
+ "200026": {
844
+ "content": "AoU",
845
+ "lstrip": false,
846
+ "normalized": false,
847
+ "rstrip": false,
848
+ "single_word": false,
849
+ "special": true
850
+ },
851
+ "200027": {
852
+ "content": "AutoSar",
853
+ "lstrip": false,
854
+ "normalized": false,
855
+ "rstrip": false,
856
+ "single_word": false,
857
+ "special": true
858
+ },
859
+ "200028": {
860
+ "content": "BAM",
861
+ "lstrip": false,
862
+ "normalized": false,
863
+ "rstrip": false,
864
+ "single_word": false,
865
+ "special": true
866
+ },
867
+ "200029": {
868
+ "content": "BCH",
869
+ "lstrip": false,
870
+ "normalized": false,
871
+ "rstrip": false,
872
+ "single_word": false,
873
+ "special": true
874
+ },
875
+ "200030": {
876
+ "content": "BIST",
877
+ "lstrip": false,
878
+ "normalized": false,
879
+ "rstrip": false,
880
+ "single_word": false,
881
+ "special": true
882
+ },
883
+ "200031": {
884
+ "content": "BOM",
885
+ "lstrip": false,
886
+ "normalized": false,
887
+ "rstrip": false,
888
+ "single_word": false,
889
+ "special": true
890
+ },
891
+ "200032": {
892
+ "content": "BPMP",
893
+ "lstrip": false,
894
+ "normalized": false,
895
+ "rstrip": false,
896
+ "single_word": false,
897
+ "special": true
898
+ },
899
+ "200033": {
900
+ "content": "BPS",
901
+ "lstrip": false,
902
+ "normalized": false,
903
+ "rstrip": false,
904
+ "single_word": false,
905
+ "special": true
906
+ },
907
+ "200034": {
908
+ "content": "BPU",
909
+ "lstrip": false,
910
+ "normalized": false,
911
+ "rstrip": false,
912
+ "single_word": false,
913
+ "special": true
914
+ },
915
+ "200035": {
916
+ "content": "BRBCT",
917
+ "lstrip": false,
918
+ "normalized": false,
919
+ "rstrip": false,
920
+ "single_word": false,
921
+ "special": true
922
+ },
923
+ "200036": {
924
+ "content": "C2C",
925
+ "lstrip": false,
926
+ "normalized": false,
927
+ "rstrip": false,
928
+ "single_word": false,
929
+ "special": true
930
+ },
931
+ "200037": {
932
+ "content": "CANFD",
933
+ "lstrip": false,
934
+ "normalized": false,
935
+ "rstrip": false,
936
+ "single_word": false,
937
+ "special": true
938
+ },
939
+ "200038": {
940
+ "content": "CAVP",
941
+ "lstrip": false,
942
+ "normalized": false,
943
+ "rstrip": false,
944
+ "single_word": false,
945
+ "special": true
946
+ },
947
+ "200039": {
948
+ "content": "CBB",
949
+ "lstrip": false,
950
+ "normalized": false,
951
+ "rstrip": false,
952
+ "single_word": false,
953
+ "special": true
954
+ },
955
+ "200040": {
956
+ "content": "CBR",
957
+ "lstrip": false,
958
+ "normalized": false,
959
+ "rstrip": false,
960
+ "single_word": false,
961
+ "special": true
962
+ },
963
+ "200041": {
964
+ "content": "CCM",
965
+ "lstrip": false,
966
+ "normalized": false,
967
+ "rstrip": false,
968
+ "single_word": false,
969
+ "special": true
970
+ },
971
+ "200042": {
972
+ "content": "CCPLEX",
973
+ "lstrip": false,
974
+ "normalized": false,
975
+ "rstrip": false,
976
+ "single_word": false,
977
+ "special": true
978
+ },
979
+ "200043": {
980
+ "content": "CCPLEX_L2",
981
+ "lstrip": false,
982
+ "normalized": false,
983
+ "rstrip": false,
984
+ "single_word": false,
985
+ "special": true
986
+ },
987
+ "200044": {
988
+ "content": "CCPLEX_MISC",
989
+ "lstrip": false,
990
+ "normalized": false,
991
+ "rstrip": false,
992
+ "single_word": false,
993
+ "special": true
994
+ },
995
+ "200045": {
996
+ "content": "CCPLEX_SCF",
997
+ "lstrip": false,
998
+ "normalized": false,
999
+ "rstrip": false,
1000
+ "single_word": false,
1001
+ "special": true
1002
+ },
1003
+ "200046": {
1004
+ "content": "CIF",
1005
+ "lstrip": false,
1006
+ "normalized": false,
1007
+ "rstrip": false,
1008
+ "single_word": false,
1009
+ "special": true
1010
+ },
1011
+ "200047": {
1012
+ "content": "CMAC",
1013
+ "lstrip": false,
1014
+ "normalized": false,
1015
+ "rstrip": false,
1016
+ "single_word": false,
1017
+ "special": true
1018
+ },
1019
+ "200048": {
1020
+ "content": "CPE",
1021
+ "lstrip": false,
1022
+ "normalized": false,
1023
+ "rstrip": false,
1024
+ "single_word": false,
1025
+ "special": true
1026
+ },
1027
+ "200049": {
1028
+ "content": "CSP",
1029
+ "lstrip": false,
1030
+ "normalized": false,
1031
+ "rstrip": false,
1032
+ "single_word": false,
1033
+ "special": true
1034
+ },
1035
+ "200050": {
1036
+ "content": "CTXT",
1037
+ "lstrip": false,
1038
+ "normalized": false,
1039
+ "rstrip": false,
1040
+ "single_word": false,
1041
+ "special": true
1042
+ },
1043
+ "200051": {
1044
+ "content": "DBB",
1045
+ "lstrip": false,
1046
+ "normalized": false,
1047
+ "rstrip": false,
1048
+ "single_word": false,
1049
+ "special": true
1050
+ },
1051
+ "200052": {
1052
+ "content": "DFA",
1053
+ "lstrip": false,
1054
+ "normalized": false,
1055
+ "rstrip": false,
1056
+ "single_word": false,
1057
+ "special": true
1058
+ },
1059
+ "200053": {
1060
+ "content": "DFT",
1061
+ "lstrip": false,
1062
+ "normalized": false,
1063
+ "rstrip": false,
1064
+ "single_word": false,
1065
+ "special": true
1066
+ },
1067
+ "200054": {
1068
+ "content": "DIP",
1069
+ "lstrip": false,
1070
+ "normalized": false,
1071
+ "rstrip": false,
1072
+ "single_word": false,
1073
+ "special": true
1074
+ },
1075
+ "200055": {
1076
+ "content": "DLA",
1077
+ "lstrip": false,
1078
+ "normalized": false,
1079
+ "rstrip": false,
1080
+ "single_word": false,
1081
+ "special": true
1082
+ },
1083
+ "200056": {
1084
+ "content": "DMEM",
1085
+ "lstrip": false,
1086
+ "normalized": false,
1087
+ "rstrip": false,
1088
+ "single_word": false,
1089
+ "special": true
1090
+ },
1091
+ "200057": {
1092
+ "content": "DPA",
1093
+ "lstrip": false,
1094
+ "normalized": false,
1095
+ "rstrip": false,
1096
+ "single_word": false,
1097
+ "special": true
1098
+ },
1099
+ "200058": {
1100
+ "content": "DSC",
1101
+ "lstrip": false,
1102
+ "normalized": false,
1103
+ "rstrip": false,
1104
+ "single_word": false,
1105
+ "special": true
1106
+ },
1107
+ "200059": {
1108
+ "content": "DVMU",
1109
+ "lstrip": false,
1110
+ "normalized": false,
1111
+ "rstrip": false,
1112
+ "single_word": false,
1113
+ "special": true
1114
+ },
1115
+ "200060": {
1116
+ "content": "ECDHE",
1117
+ "lstrip": false,
1118
+ "normalized": false,
1119
+ "rstrip": false,
1120
+ "single_word": false,
1121
+ "special": true
1122
+ },
1123
+ "200061": {
1124
+ "content": "ECDSA",
1125
+ "lstrip": false,
1126
+ "normalized": false,
1127
+ "rstrip": false,
1128
+ "single_word": false,
1129
+ "special": true
1130
+ },
1131
+ "200062": {
1132
+ "content": "ECID",
1133
+ "lstrip": false,
1134
+ "normalized": false,
1135
+ "rstrip": false,
1136
+ "single_word": false,
1137
+ "special": true
1138
+ },
1139
+ "200063": {
1140
+ "content": "EDR",
1141
+ "lstrip": false,
1142
+ "normalized": false,
1143
+ "rstrip": false,
1144
+ "single_word": false,
1145
+ "special": true
1146
+ },
1147
+ "200064": {
1148
+ "content": "EOTTI",
1149
+ "lstrip": false,
1150
+ "normalized": false,
1151
+ "rstrip": false,
1152
+ "single_word": false,
1153
+ "special": true
1154
+ },
1155
+ "200065": {
1156
+ "content": "EQoS",
1157
+ "lstrip": false,
1158
+ "normalized": false,
1159
+ "rstrip": false,
1160
+ "single_word": false,
1161
+ "special": true
1162
+ },
1163
+ "200066": {
1164
+ "content": "FCL",
1165
+ "lstrip": false,
1166
+ "normalized": false,
1167
+ "rstrip": false,
1168
+ "single_word": false,
1169
+ "special": true
1170
+ },
1171
+ "200067": {
1172
+ "content": "FHTI",
1173
+ "lstrip": false,
1174
+ "normalized": false,
1175
+ "rstrip": false,
1176
+ "single_word": false,
1177
+ "special": true
1178
+ },
1179
+ "200068": {
1180
+ "content": "FIPS",
1181
+ "lstrip": false,
1182
+ "normalized": false,
1183
+ "rstrip": false,
1184
+ "single_word": false,
1185
+ "special": true
1186
+ },
1187
+ "200069": {
1188
+ "content": "FMEA",
1189
+ "lstrip": false,
1190
+ "normalized": false,
1191
+ "rstrip": false,
1192
+ "single_word": false,
1193
+ "special": true
1194
+ },
1195
+ "200070": {
1196
+ "content": "FMON",
1197
+ "lstrip": false,
1198
+ "normalized": false,
1199
+ "rstrip": false,
1200
+ "single_word": false,
1201
+ "special": true
1202
+ },
1203
+ "200071": {
1204
+ "content": "FuSa",
1205
+ "lstrip": false,
1206
+ "normalized": false,
1207
+ "rstrip": false,
1208
+ "single_word": false,
1209
+ "special": true
1210
+ },
1211
+ "200072": {
1212
+ "content": "GCM",
1213
+ "lstrip": false,
1214
+ "normalized": false,
1215
+ "rstrip": false,
1216
+ "single_word": false,
1217
+ "special": true
1218
+ },
1219
+ "200073": {
1220
+ "content": "GFD",
1221
+ "lstrip": false,
1222
+ "normalized": false,
1223
+ "rstrip": false,
1224
+ "single_word": false,
1225
+ "special": true
1226
+ },
1227
+ "200074": {
1228
+ "content": "GIC",
1229
+ "lstrip": false,
1230
+ "normalized": false,
1231
+ "rstrip": false,
1232
+ "single_word": false,
1233
+ "special": true
1234
+ },
1235
+ "200075": {
1236
+ "content": "GMAC",
1237
+ "lstrip": false,
1238
+ "normalized": false,
1239
+ "rstrip": false,
1240
+ "single_word": false,
1241
+ "special": true
1242
+ },
1243
+ "200076": {
1244
+ "content": "GMSL",
1245
+ "lstrip": false,
1246
+ "normalized": false,
1247
+ "rstrip": false,
1248
+ "single_word": false,
1249
+ "special": true
1250
+ },
1251
+ "200077": {
1252
+ "content": "GOP",
1253
+ "lstrip": false,
1254
+ "normalized": false,
1255
+ "rstrip": false,
1256
+ "single_word": false,
1257
+ "special": true
1258
+ },
1259
+ "200078": {
1260
+ "content": "GPCDMA",
1261
+ "lstrip": false,
1262
+ "normalized": false,
1263
+ "rstrip": false,
1264
+ "single_word": false,
1265
+ "special": true
1266
+ },
1267
+ "200079": {
1268
+ "content": "Gpps",
1269
+ "lstrip": false,
1270
+ "normalized": false,
1271
+ "rstrip": false,
1272
+ "single_word": false,
1273
+ "special": true
1274
+ },
1275
+ "200080": {
1276
+ "content": "HBR",
1277
+ "lstrip": false,
1278
+ "normalized": false,
1279
+ "rstrip": false,
1280
+ "single_word": false,
1281
+ "special": true
1282
+ },
1283
+ "200081": {
1284
+ "content": "HBR2",
1285
+ "lstrip": false,
1286
+ "normalized": false,
1287
+ "rstrip": false,
1288
+ "single_word": false,
1289
+ "special": true
1290
+ },
1291
+ "200082": {
1292
+ "content": "HBR3",
1293
+ "lstrip": false,
1294
+ "normalized": false,
1295
+ "rstrip": false,
1296
+ "single_word": false,
1297
+ "special": true
1298
+ },
1299
+ "200083": {
1300
+ "content": "HDS",
1301
+ "lstrip": false,
1302
+ "normalized": false,
1303
+ "rstrip": false,
1304
+ "single_word": false,
1305
+ "special": true
1306
+ },
1307
+ "200084": {
1308
+ "content": "HIS",
1309
+ "lstrip": false,
1310
+ "normalized": false,
1311
+ "rstrip": false,
1312
+ "single_word": false,
1313
+ "special": true
1314
+ },
1315
+ "200085": {
1316
+ "content": "HMAC",
1317
+ "lstrip": false,
1318
+ "normalized": false,
1319
+ "rstrip": false,
1320
+ "single_word": false,
1321
+ "special": true
1322
+ },
1323
+ "200086": {
1324
+ "content": "HPSE",
1325
+ "lstrip": false,
1326
+ "normalized": false,
1327
+ "rstrip": false,
1328
+ "single_word": false,
1329
+ "special": true
1330
+ },
1331
+ "200087": {
1332
+ "content": "HSI",
1333
+ "lstrip": false,
1334
+ "normalized": false,
1335
+ "rstrip": false,
1336
+ "single_word": false,
1337
+ "special": true
1338
+ },
1339
+ "200088": {
1340
+ "content": "HSM",
1341
+ "lstrip": false,
1342
+ "normalized": false,
1343
+ "rstrip": false,
1344
+ "single_word": false,
1345
+ "special": true
1346
+ },
1347
+ "200089": {
1348
+ "content": "HSP",
1349
+ "lstrip": false,
1350
+ "normalized": false,
1351
+ "rstrip": false,
1352
+ "single_word": false,
1353
+ "special": true
1354
+ },
1355
+ "200090": {
1356
+ "content": "ICD",
1357
+ "lstrip": false,
1358
+ "normalized": false,
1359
+ "rstrip": false,
1360
+ "single_word": false,
1361
+ "special": true
1362
+ },
1363
+ "200091": {
1364
+ "content": "IDR",
1365
+ "lstrip": false,
1366
+ "normalized": false,
1367
+ "rstrip": false,
1368
+ "single_word": false,
1369
+ "special": true
1370
+ },
1371
+ "200092": {
1372
+ "content": "IDT",
1373
+ "lstrip": false,
1374
+ "normalized": false,
1375
+ "rstrip": false,
1376
+ "single_word": false,
1377
+ "special": true
1378
+ },
1379
+ "200093": {
1380
+ "content": "IEP",
1381
+ "lstrip": false,
1382
+ "normalized": false,
1383
+ "rstrip": false,
1384
+ "single_word": false,
1385
+ "special": true
1386
+ },
1387
+ "200094": {
1388
+ "content": "IEU",
1389
+ "lstrip": false,
1390
+ "normalized": false,
1391
+ "rstrip": false,
1392
+ "single_word": false,
1393
+ "special": true
1394
+ },
1395
+ "200095": {
1396
+ "content": "IFU",
1397
+ "lstrip": false,
1398
+ "normalized": false,
1399
+ "rstrip": false,
1400
+ "single_word": false,
1401
+ "special": true
1402
+ },
1403
+ "200096": {
1404
+ "content": "IMEM",
1405
+ "lstrip": false,
1406
+ "normalized": false,
1407
+ "rstrip": false,
1408
+ "single_word": false,
1409
+ "special": true
1410
+ },
1411
+ "200097": {
1412
+ "content": "IOFA",
1413
+ "lstrip": false,
1414
+ "normalized": false,
1415
+ "rstrip": false,
1416
+ "single_word": false,
1417
+ "special": true
1418
+ },
1419
+ "200098": {
1420
+ "content": "IOMMU",
1421
+ "lstrip": false,
1422
+ "normalized": false,
1423
+ "rstrip": false,
1424
+ "single_word": false,
1425
+ "special": true
1426
+ },
1427
+ "200099": {
1428
+ "content": "IRF",
1429
+ "lstrip": false,
1430
+ "normalized": false,
1431
+ "rstrip": false,
1432
+ "single_word": false,
1433
+ "special": true
1434
+ },
1435
+ "200100": {
1436
+ "content": "IoT",
1437
+ "lstrip": false,
1438
+ "normalized": false,
1439
+ "rstrip": false,
1440
+ "single_word": false,
1441
+ "special": true
1442
+ },
1443
+ "200101": {
1444
+ "content": "JSR",
1445
+ "lstrip": false,
1446
+ "normalized": false,
1447
+ "rstrip": false,
1448
+ "single_word": false,
1449
+ "special": true
1450
+ },
1451
+ "200102": {
1452
+ "content": "KAT",
1453
+ "lstrip": false,
1454
+ "normalized": false,
1455
+ "rstrip": false,
1456
+ "single_word": false,
1457
+ "special": true
1458
+ },
1459
+ "200103": {
1460
+ "content": "KCV",
1461
+ "lstrip": false,
1462
+ "normalized": false,
1463
+ "rstrip": false,
1464
+ "single_word": false,
1465
+ "special": true
1466
+ },
1467
+ "200104": {
1468
+ "content": "KDF",
1469
+ "lstrip": false,
1470
+ "normalized": false,
1471
+ "rstrip": false,
1472
+ "single_word": false,
1473
+ "special": true
1474
+ },
1475
+ "200105": {
1476
+ "content": "KPI",
1477
+ "lstrip": false,
1478
+ "normalized": false,
1479
+ "rstrip": false,
1480
+ "single_word": false,
1481
+ "special": true
1482
+ },
1483
+ "200106": {
1484
+ "content": "L1PT",
1485
+ "lstrip": false,
1486
+ "normalized": false,
1487
+ "rstrip": false,
1488
+ "single_word": false,
1489
+ "special": true
1490
+ },
1491
+ "200107": {
1492
+ "content": "L2C",
1493
+ "lstrip": false,
1494
+ "normalized": false,
1495
+ "rstrip": false,
1496
+ "single_word": false,
1497
+ "special": true
1498
+ },
1499
+ "200108": {
1500
+ "content": "L2mDIR",
1501
+ "lstrip": false,
1502
+ "normalized": false,
1503
+ "rstrip": false,
1504
+ "single_word": false,
1505
+ "special": true
1506
+ },
1507
+ "200109": {
1508
+ "content": "L2vDIR",
1509
+ "lstrip": false,
1510
+ "normalized": false,
1511
+ "rstrip": false,
1512
+ "single_word": false,
1513
+ "special": true
1514
+ },
1515
+ "200110": {
1516
+ "content": "LBIST",
1517
+ "lstrip": false,
1518
+ "normalized": false,
1519
+ "rstrip": false,
1520
+ "single_word": false,
1521
+ "special": true
1522
+ },
1523
+ "200111": {
1524
+ "content": "LDC",
1525
+ "lstrip": false,
1526
+ "normalized": false,
1527
+ "rstrip": false,
1528
+ "single_word": false,
1529
+ "special": true
1530
+ },
1531
+ "200112": {
1532
+ "content": "LFT",
1533
+ "lstrip": false,
1534
+ "normalized": false,
1535
+ "rstrip": false,
1536
+ "single_word": false,
1537
+ "special": true
1538
+ },
1539
+ "200113": {
1540
+ "content": "LIP",
1541
+ "lstrip": false,
1542
+ "normalized": false,
1543
+ "rstrip": false,
1544
+ "single_word": false,
1545
+ "special": true
1546
+ },
1547
+ "200114": {
1548
+ "content": "LSB",
1549
+ "lstrip": false,
1550
+ "normalized": false,
1551
+ "rstrip": false,
1552
+ "single_word": false,
1553
+ "special": true
1554
+ },
1555
+ "200115": {
1556
+ "content": "MAQ",
1557
+ "lstrip": false,
1558
+ "normalized": false,
1559
+ "rstrip": false,
1560
+ "single_word": false,
1561
+ "special": true
1562
+ },
1563
+ "200116": {
1564
+ "content": "MBIST",
1565
+ "lstrip": false,
1566
+ "normalized": false,
1567
+ "rstrip": false,
1568
+ "single_word": false,
1569
+ "special": true
1570
+ },
1571
+ "200117": {
1572
+ "content": "MCAL",
1573
+ "lstrip": false,
1574
+ "normalized": false,
1575
+ "rstrip": false,
1576
+ "single_word": false,
1577
+ "special": true
1578
+ },
1579
+ "200118": {
1580
+ "content": "MCE",
1581
+ "lstrip": false,
1582
+ "normalized": false,
1583
+ "rstrip": false,
1584
+ "single_word": false,
1585
+ "special": true
1586
+ },
1587
+ "200119": {
1588
+ "content": "MCU",
1589
+ "lstrip": false,
1590
+ "normalized": false,
1591
+ "rstrip": false,
1592
+ "single_word": false,
1593
+ "special": true
1594
+ },
1595
+ "200120": {
1596
+ "content": "MSB",
1597
+ "lstrip": false,
1598
+ "normalized": false,
1599
+ "rstrip": false,
1600
+ "single_word": false,
1601
+ "special": true
1602
+ },
1603
+ "200121": {
1604
+ "content": "MSS",
1605
+ "lstrip": false,
1606
+ "normalized": false,
1607
+ "rstrip": false,
1608
+ "single_word": false,
1609
+ "special": true
1610
+ },
1611
+ "200122": {
1612
+ "content": "MST",
1613
+ "lstrip": false,
1614
+ "normalized": false,
1615
+ "rstrip": false,
1616
+ "single_word": false,
1617
+ "special": true
1618
+ },
1619
+ "200123": {
1620
+ "content": "MTS",
1621
+ "lstrip": false,
1622
+ "normalized": false,
1623
+ "rstrip": false,
1624
+ "single_word": false,
1625
+ "special": true
1626
+ },
1627
+ "200124": {
1628
+ "content": "MiTM",
1629
+ "lstrip": false,
1630
+ "normalized": false,
1631
+ "rstrip": false,
1632
+ "single_word": false,
1633
+ "special": true
1634
+ },
1635
+ "200125": {
1636
+ "content": "NIP",
1637
+ "lstrip": false,
1638
+ "normalized": false,
1639
+ "rstrip": false,
1640
+ "single_word": false,
1641
+ "special": true
1642
+ },
1643
+ "200126": {
1644
+ "content": "NIST",
1645
+ "lstrip": false,
1646
+ "normalized": false,
1647
+ "rstrip": false,
1648
+ "single_word": false,
1649
+ "special": true
1650
+ },
1651
+ "200127": {
1652
+ "content": "NITO",
1653
+ "lstrip": false,
1654
+ "normalized": false,
1655
+ "rstrip": false,
1656
+ "single_word": false,
1657
+ "special": true
1658
+ },
1659
+ "200128": {
1660
+ "content": "NOC",
1661
+ "lstrip": false,
1662
+ "normalized": false,
1663
+ "rstrip": false,
1664
+ "single_word": false,
1665
+ "special": true
1666
+ },
1667
+ "200129": {
1668
+ "content": "NOOP",
1669
+ "lstrip": false,
1670
+ "normalized": false,
1671
+ "rstrip": false,
1672
+ "single_word": false,
1673
+ "special": true
1674
+ },
1675
+ "200130": {
1676
+ "content": "NVDEC",
1677
+ "lstrip": false,
1678
+ "normalized": false,
1679
+ "rstrip": false,
1680
+ "single_word": false,
1681
+ "special": true
1682
+ },
1683
+ "200131": {
1684
+ "content": "NVENC",
1685
+ "lstrip": false,
1686
+ "normalized": false,
1687
+ "rstrip": false,
1688
+ "single_word": false,
1689
+ "special": true
1690
+ },
1691
+ "200132": {
1692
+ "content": "NVJPG",
1693
+ "lstrip": false,
1694
+ "normalized": false,
1695
+ "rstrip": false,
1696
+ "single_word": false,
1697
+ "special": true
1698
+ },
1699
+ "200133": {
1700
+ "content": "NVM",
1701
+ "lstrip": false,
1702
+ "normalized": false,
1703
+ "rstrip": false,
1704
+ "single_word": false,
1705
+ "special": true
1706
+ },
1707
+ "200134": {
1708
+ "content": "NVVSE",
1709
+ "lstrip": false,
1710
+ "normalized": false,
1711
+ "rstrip": false,
1712
+ "single_word": false,
1713
+ "special": true
1714
+ },
1715
+ "200135": {
1716
+ "content": "OFA",
1717
+ "lstrip": false,
1718
+ "normalized": false,
1719
+ "rstrip": false,
1720
+ "single_word": false,
1721
+ "special": true
1722
+ },
1723
+ "200136": {
1724
+ "content": "PCIE",
1725
+ "lstrip": false,
1726
+ "normalized": false,
1727
+ "rstrip": false,
1728
+ "single_word": false,
1729
+ "special": true
1730
+ },
1731
+ "200137": {
1732
+ "content": "PCPU",
1733
+ "lstrip": false,
1734
+ "normalized": false,
1735
+ "rstrip": false,
1736
+ "single_word": false,
1737
+ "special": true
1738
+ },
1739
+ "200138": {
1740
+ "content": "PCT",
1741
+ "lstrip": false,
1742
+ "normalized": false,
1743
+ "rstrip": false,
1744
+ "single_word": false,
1745
+ "special": true
1746
+ },
1747
+ "200139": {
1748
+ "content": "PDK",
1749
+ "lstrip": false,
1750
+ "normalized": false,
1751
+ "rstrip": false,
1752
+ "single_word": false,
1753
+ "special": true
1754
+ },
1755
+ "200140": {
1756
+ "content": "PII",
1757
+ "lstrip": false,
1758
+ "normalized": false,
1759
+ "rstrip": false,
1760
+ "single_word": false,
1761
+ "special": true
1762
+ },
1763
+ "200141": {
1764
+ "content": "PIP",
1765
+ "lstrip": false,
1766
+ "normalized": false,
1767
+ "rstrip": false,
1768
+ "single_word": false,
1769
+ "special": true
1770
+ },
1771
+ "200142": {
1772
+ "content": "PKC",
1773
+ "lstrip": false,
1774
+ "normalized": false,
1775
+ "rstrip": false,
1776
+ "single_word": false,
1777
+ "special": true
1778
+ },
1779
+ "200143": {
1780
+ "content": "PKCS",
1781
+ "lstrip": false,
1782
+ "normalized": false,
1783
+ "rstrip": false,
1784
+ "single_word": false,
1785
+ "special": true
1786
+ },
1787
+ "200144": {
1788
+ "content": "PKI",
1789
+ "lstrip": false,
1790
+ "normalized": false,
1791
+ "rstrip": false,
1792
+ "single_word": false,
1793
+ "special": true
1794
+ },
1795
+ "200145": {
1796
+ "content": "PPC",
1797
+ "lstrip": false,
1798
+ "normalized": false,
1799
+ "rstrip": false,
1800
+ "single_word": false,
1801
+ "special": true
1802
+ },
1803
+ "200146": {
1804
+ "content": "PTXT",
1805
+ "lstrip": false,
1806
+ "normalized": false,
1807
+ "rstrip": false,
1808
+ "single_word": false,
1809
+ "special": true
1810
+ },
1811
+ "200147": {
1812
+ "content": "PVA",
1813
+ "lstrip": false,
1814
+ "normalized": false,
1815
+ "rstrip": false,
1816
+ "single_word": false,
1817
+ "special": true
1818
+ },
1819
+ "200148": {
1820
+ "content": "QNX",
1821
+ "lstrip": false,
1822
+ "normalized": false,
1823
+ "rstrip": false,
1824
+ "single_word": false,
1825
+ "special": true
1826
+ },
1827
+ "200149": {
1828
+ "content": "QOS",
1829
+ "lstrip": false,
1830
+ "normalized": false,
1831
+ "rstrip": false,
1832
+ "single_word": false,
1833
+ "special": true
1834
+ },
1835
+ "200150": {
1836
+ "content": "QSPI",
1837
+ "lstrip": false,
1838
+ "normalized": false,
1839
+ "rstrip": false,
1840
+ "single_word": false,
1841
+ "special": true
1842
+ },
1843
+ "200151": {
1844
+ "content": "RBG",
1845
+ "lstrip": false,
1846
+ "normalized": false,
1847
+ "rstrip": false,
1848
+ "single_word": false,
1849
+ "special": true
1850
+ },
1851
+ "200152": {
1852
+ "content": "RBR",
1853
+ "lstrip": false,
1854
+ "normalized": false,
1855
+ "rstrip": false,
1856
+ "single_word": false,
1857
+ "special": true
1858
+ },
1859
+ "200153": {
1860
+ "content": "RDEV",
1861
+ "lstrip": false,
1862
+ "normalized": false,
1863
+ "rstrip": false,
1864
+ "single_word": false,
1865
+ "special": true
1866
+ },
1867
+ "200154": {
1868
+ "content": "RMA",
1869
+ "lstrip": false,
1870
+ "normalized": false,
1871
+ "rstrip": false,
1872
+ "single_word": false,
1873
+ "special": true
1874
+ },
1875
+ "200155": {
1876
+ "content": "RMW",
1877
+ "lstrip": false,
1878
+ "normalized": false,
1879
+ "rstrip": false,
1880
+ "single_word": false,
1881
+ "special": true
1882
+ },
1883
+ "200156": {
1884
+ "content": "RSB",
1885
+ "lstrip": false,
1886
+ "normalized": false,
1887
+ "rstrip": false,
1888
+ "single_word": false,
1889
+ "special": true
1890
+ },
1891
+ "200157": {
1892
+ "content": "RTS",
1893
+ "lstrip": false,
1894
+ "normalized": false,
1895
+ "rstrip": false,
1896
+ "single_word": false,
1897
+ "special": true
1898
+ },
1899
+ "200158": {
1900
+ "content": "RoT",
1901
+ "lstrip": false,
1902
+ "normalized": false,
1903
+ "rstrip": false,
1904
+ "single_word": false,
1905
+ "special": true
1906
+ },
1907
+ "200159": {
1908
+ "content": "SAE",
1909
+ "lstrip": false,
1910
+ "normalized": false,
1911
+ "rstrip": false,
1912
+ "single_word": false,
1913
+ "special": true
1914
+ },
1915
+ "200160": {
1916
+ "content": "SBK",
1917
+ "lstrip": false,
1918
+ "normalized": false,
1919
+ "rstrip": false,
1920
+ "single_word": false,
1921
+ "special": true
1922
+ },
1923
+ "200161": {
1924
+ "content": "SEL0",
1925
+ "lstrip": false,
1926
+ "normalized": false,
1927
+ "rstrip": false,
1928
+ "single_word": false,
1929
+ "special": true
1930
+ },
1931
+ "200162": {
1932
+ "content": "SEL1",
1933
+ "lstrip": false,
1934
+ "normalized": false,
1935
+ "rstrip": false,
1936
+ "single_word": false,
1937
+ "special": true
1938
+ },
1939
+ "200163": {
1940
+ "content": "SEooC",
1941
+ "lstrip": false,
1942
+ "normalized": false,
1943
+ "rstrip": false,
1944
+ "single_word": false,
1945
+ "special": true
1946
+ },
1947
+ "200164": {
1948
+ "content": "SGM",
1949
+ "lstrip": false,
1950
+ "normalized": false,
1951
+ "rstrip": false,
1952
+ "single_word": false,
1953
+ "special": true
1954
+ },
1955
+ "200165": {
1956
+ "content": "SHA256",
1957
+ "lstrip": false,
1958
+ "normalized": false,
1959
+ "rstrip": false,
1960
+ "single_word": false,
1961
+ "special": true
1962
+ },
1963
+ "200166": {
1964
+ "content": "SHA512",
1965
+ "lstrip": false,
1966
+ "normalized": false,
1967
+ "rstrip": false,
1968
+ "single_word": false,
1969
+ "special": true
1970
+ },
1971
+ "200167": {
1972
+ "content": "SHE",
1973
+ "lstrip": false,
1974
+ "normalized": false,
1975
+ "rstrip": false,
1976
+ "single_word": false,
1977
+ "special": true
1978
+ },
1979
+ "200168": {
1980
+ "content": "SNOC",
1981
+ "lstrip": false,
1982
+ "normalized": false,
1983
+ "rstrip": false,
1984
+ "single_word": false,
1985
+ "special": true
1986
+ },
1987
+ "200169": {
1988
+ "content": "SST",
1989
+ "lstrip": false,
1990
+ "normalized": false,
1991
+ "rstrip": false,
1992
+ "single_word": false,
1993
+ "special": true
1994
+ },
1995
+ "200170": {
1996
+ "content": "SWAT",
1997
+ "lstrip": false,
1998
+ "normalized": false,
1999
+ "rstrip": false,
2000
+ "single_word": false,
2001
+ "special": true
2002
+ },
2003
+ "200171": {
2004
+ "content": "SoC",
2005
+ "lstrip": false,
2006
+ "normalized": false,
2007
+ "rstrip": false,
2008
+ "single_word": false,
2009
+ "special": true
2010
+ },
2011
+ "200172": {
2012
+ "content": "TCF",
2013
+ "lstrip": false,
2014
+ "normalized": false,
2015
+ "rstrip": false,
2016
+ "single_word": false,
2017
+ "special": true
2018
+ },
2019
+ "200173": {
2020
+ "content": "THI",
2021
+ "lstrip": false,
2022
+ "normalized": false,
2023
+ "rstrip": false,
2024
+ "single_word": false,
2025
+ "special": true
2026
+ },
2027
+ "200174": {
2028
+ "content": "TNR",
2029
+ "lstrip": false,
2030
+ "normalized": false,
2031
+ "rstrip": false,
2032
+ "single_word": false,
2033
+ "special": true
2034
+ },
2035
+ "200175": {
2036
+ "content": "TOS",
2037
+ "lstrip": false,
2038
+ "normalized": false,
2039
+ "rstrip": false,
2040
+ "single_word": false,
2041
+ "special": true
2042
+ },
2043
+ "200176": {
2044
+ "content": "TRC",
2045
+ "lstrip": false,
2046
+ "normalized": false,
2047
+ "rstrip": false,
2048
+ "single_word": false,
2049
+ "special": true
2050
+ },
2051
+ "200177": {
2052
+ "content": "TSEC",
2053
+ "lstrip": false,
2054
+ "normalized": false,
2055
+ "rstrip": false,
2056
+ "single_word": false,
2057
+ "special": true
2058
+ },
2059
+ "200178": {
2060
+ "content": "UFS",
2061
+ "lstrip": false,
2062
+ "normalized": false,
2063
+ "rstrip": false,
2064
+ "single_word": false,
2065
+ "special": true
2066
+ },
2067
+ "200179": {
2068
+ "content": "VBR",
2069
+ "lstrip": false,
2070
+ "normalized": false,
2071
+ "rstrip": false,
2072
+ "single_word": false,
2073
+ "special": true
2074
+ },
2075
+ "200180": {
2076
+ "content": "VCPU",
2077
+ "lstrip": false,
2078
+ "normalized": false,
2079
+ "rstrip": false,
2080
+ "single_word": false,
2081
+ "special": true
2082
+ },
2083
+ "200181": {
2084
+ "content": "VIC",
2085
+ "lstrip": false,
2086
+ "normalized": false,
2087
+ "rstrip": false,
2088
+ "single_word": false,
2089
+ "special": true
2090
+ },
2091
+ "200182": {
2092
+ "content": "VMEM",
2093
+ "lstrip": false,
2094
+ "normalized": false,
2095
+ "rstrip": false,
2096
+ "single_word": false,
2097
+ "special": true
2098
+ },
2099
+ "200183": {
2100
+ "content": "VMID",
2101
+ "lstrip": false,
2102
+ "normalized": false,
2103
+ "rstrip": false,
2104
+ "single_word": false,
2105
+ "special": true
2106
+ },
2107
+ "200184": {
2108
+ "content": "VPU",
2109
+ "lstrip": false,
2110
+ "normalized": false,
2111
+ "rstrip": false,
2112
+ "single_word": false,
2113
+ "special": true
2114
+ },
2115
+ "200185": {
2116
+ "content": "VRC",
2117
+ "lstrip": false,
2118
+ "normalized": false,
2119
+ "rstrip": false,
2120
+ "single_word": false,
2121
+ "special": true
2122
+ },
2123
+ "200186": {
2124
+ "content": "VUI",
2125
+ "lstrip": false,
2126
+ "normalized": false,
2127
+ "rstrip": false,
2128
+ "single_word": false,
2129
+ "special": true
2130
+ },
2131
+ "200187": {
2132
+ "content": "WARB",
2133
+ "lstrip": false,
2134
+ "normalized": false,
2135
+ "rstrip": false,
2136
+ "single_word": false,
2137
+ "special": true
2138
+ },
2139
+ "200188": {
2140
+ "content": "XIP",
2141
+ "lstrip": false,
2142
+ "normalized": false,
2143
+ "rstrip": false,
2144
+ "single_word": false,
2145
+ "special": true
2146
+ },
2147
+ "200189": {
2148
+ "content": "bpp",
2149
+ "lstrip": false,
2150
+ "normalized": false,
2151
+ "rstrip": false,
2152
+ "single_word": false,
2153
+ "special": true
2154
+ },
2155
+ "200190": {
2156
+ "content": "eMMC",
2157
+ "lstrip": false,
2158
+ "normalized": false,
2159
+ "rstrip": false,
2160
+ "single_word": false,
2161
+ "special": true
2162
+ },
2163
+ "200191": {
2164
+ "content": "hfPLA",
2165
+ "lstrip": false,
2166
+ "normalized": false,
2167
+ "rstrip": false,
2168
+ "single_word": false,
2169
+ "special": true
2170
+ },
2171
+ "200192": {
2172
+ "content": "iGPU",
2173
+ "lstrip": false,
2174
+ "normalized": false,
2175
+ "rstrip": false,
2176
+ "single_word": false,
2177
+ "special": true
2178
+ },
2179
+ "200193": {
2180
+ "content": "ipc_fg",
2181
+ "lstrip": false,
2182
+ "normalized": false,
2183
+ "rstrip": false,
2184
+ "single_word": false,
2185
+ "special": true
2186
+ },
2187
+ "200194": {
2188
+ "content": "ipc_t",
2189
+ "lstrip": false,
2190
+ "normalized": false,
2191
+ "rstrip": false,
2192
+ "single_word": false,
2193
+ "special": true
2194
+ },
2195
+ "200195": {
2196
+ "content": "sbPLA",
2197
+ "lstrip": false,
2198
+ "normalized": false,
2199
+ "rstrip": false,
2200
+ "single_word": false,
2201
+ "special": true
2202
+ },
2203
+ "200196": {
2204
+ "content": "xBTV",
2205
+ "lstrip": false,
2206
+ "normalized": false,
2207
+ "rstrip": false,
2208
+ "single_word": false,
2209
+ "special": true
2210
+ },
2211
+ "200197": {
2212
+ "content": "xps",
2213
+ "lstrip": false,
2214
+ "normalized": false,
2215
+ "rstrip": false,
2216
+ "single_word": false,
2217
+ "special": true
2218
+ }
2219
+ },
2220
+ "additional_special_tokens": [
2221
+ "AAD",
2222
+ "AArch64",
2223
+ "ACL",
2224
+ "AD",
2225
+ "AES",
2226
+ "AES256GCM",
2227
+ "AESCBC",
2228
+ "AKE",
2229
+ "AON",
2230
+ "ASID",
2231
+ "AXI",
2232
+ "Acronym",
2233
+ "AoU",
2234
+ "AutoSar",
2235
+ "BAM",
2236
+ "BCH",
2237
+ "BIST",
2238
+ "BOM",
2239
+ "BPMP",
2240
+ "BPS",
2241
+ "BPU",
2242
+ "BRBCT",
2243
+ "BW",
2244
+ "C2C",
2245
+ "CA",
2246
+ "CAN",
2247
+ "CANFD",
2248
+ "CAR",
2249
+ "CAVP",
2250
+ "CBB",
2251
+ "CBC",
2252
+ "CBR",
2253
+ "CCM",
2254
+ "CCPLEX",
2255
+ "CCPLEX_L2",
2256
+ "CCPLEX_MISC",
2257
+ "CCPLEX_SCF",
2258
+ "CDD",
2259
+ "CIF",
2260
+ "CMAC",
2261
+ "CPE",
2262
+ "CPU",
2263
+ "CRC",
2264
+ "CSI",
2265
+ "CSP",
2266
+ "CTR",
2267
+ "CTXT",
2268
+ "CV",
2269
+ "DBB",
2270
+ "DEP",
2271
+ "DEV",
2272
+ "DFA",
2273
+ "DFT",
2274
+ "DIP",
2275
+ "DISPLAY",
2276
+ "DLA",
2277
+ "DMA",
2278
+ "DMEM",
2279
+ "DPA",
2280
+ "DSC",
2281
+ "DT",
2282
+ "DU",
2283
+ "DVMU",
2284
+ "EC",
2285
+ "ECB",
2286
+ "ECC",
2287
+ "ECDHE",
2288
+ "ECDSA",
2289
+ "ECID",
2290
+ "EDR",
2291
+ "EOF",
2292
+ "EOTTI",
2293
+ "EQoS",
2294
+ "FCL",
2295
+ "FHTI",
2296
+ "FIPS",
2297
+ "FMEA",
2298
+ "FMON",
2299
+ "FO",
2300
+ "FP",
2301
+ "FPS",
2302
+ "FW",
2303
+ "FuSa",
2304
+ "GCM",
2305
+ "GFD",
2306
+ "GIC",
2307
+ "GMAC",
2308
+ "GMSL",
2309
+ "GOP",
2310
+ "GP",
2311
+ "GPCDMA",
2312
+ "GPU",
2313
+ "GR",
2314
+ "Gpps",
2315
+ "HBR",
2316
+ "HBR2",
2317
+ "HBR3",
2318
+ "HDS",
2319
+ "HIS",
2320
+ "HMAC",
2321
+ "HPSE",
2322
+ "HSI",
2323
+ "HSM",
2324
+ "HSP",
2325
+ "HW",
2326
+ "IAS",
2327
+ "IC",
2328
+ "ICD",
2329
+ "IDR",
2330
+ "IDT",
2331
+ "IEP",
2332
+ "IEU",
2333
+ "IFU",
2334
+ "IID",
2335
+ "ILD",
2336
+ "IMEM",
2337
+ "IOC",
2338
+ "IOFA",
2339
+ "IOMMU",
2340
+ "IPC",
2341
+ "IPI",
2342
+ "IRF",
2343
+ "IST",
2344
+ "IV",
2345
+ "IoT",
2346
+ "JSR",
2347
+ "KAT",
2348
+ "KCV",
2349
+ "KDF",
2350
+ "KPI",
2351
+ "L1PT",
2352
+ "L2C",
2353
+ "L2mDIR",
2354
+ "L2vDIR",
2355
+ "LAB",
2356
+ "LBIST",
2357
+ "LDC",
2358
+ "LFT",
2359
+ "LIC",
2360
+ "LIP",
2361
+ "LSB",
2362
+ "MAC",
2363
+ "MAQ",
2364
+ "MB",
2365
+ "MBIST",
2366
+ "MCAL",
2367
+ "MCE",
2368
+ "MCU",
2369
+ "MSB",
2370
+ "MSS",
2371
+ "MST",
2372
+ "MTS",
2373
+ "MiTM",
2374
+ "NIP",
2375
+ "NIST",
2376
+ "NITO",
2377
+ "NOC",
2378
+ "NOOP",
2379
+ "NT",
2380
+ "NVDEC",
2381
+ "NVENC",
2382
+ "NVJPG",
2383
+ "NVM",
2384
+ "NVVSE",
2385
+ "OEM",
2386
+ "OFA",
2387
+ "OS",
2388
+ "OSP",
2389
+ "OTP",
2390
+ "PB",
2391
+ "PCIE",
2392
+ "PCPU",
2393
+ "PCR",
2394
+ "PCT",
2395
+ "PDK",
2396
+ "PII",
2397
+ "PIP",
2398
+ "PKC",
2399
+ "PKCS",
2400
+ "PKI",
2401
+ "PL",
2402
+ "PLA",
2403
+ "POR",
2404
+ "PPC",
2405
+ "PSC",
2406
+ "PTXT",
2407
+ "PVA",
2408
+ "QNX",
2409
+ "QOS",
2410
+ "QSPI",
2411
+ "RBG",
2412
+ "RBR",
2413
+ "RC",
2414
+ "RDEV",
2415
+ "REE",
2416
+ "RMA",
2417
+ "RMW",
2418
+ "RSA",
2419
+ "RSB",
2420
+ "RTS",
2421
+ "RoT",
2422
+ "SAE",
2423
+ "SBK",
2424
+ "SCH",
2425
+ "SDK",
2426
+ "SE",
2427
+ "SEL0",
2428
+ "SEL1",
2429
+ "SEooC",
2430
+ "SGM",
2431
+ "SHA",
2432
+ "SHA256",
2433
+ "SHA512",
2434
+ "SHE",
2435
+ "SKU",
2436
+ "SNOC",
2437
+ "SO",
2438
+ "SPA",
2439
+ "SQ",
2440
+ "SSR",
2441
+ "SST",
2442
+ "SW",
2443
+ "SWAT",
2444
+ "SoC",
2445
+ "TA",
2446
+ "TCF",
2447
+ "TEE",
2448
+ "THI",
2449
+ "TNR",
2450
+ "TOS",
2451
+ "TRC",
2452
+ "TRL",
2453
+ "TSEC",
2454
+ "TZ",
2455
+ "UFS",
2456
+ "VBR",
2457
+ "VCPU",
2458
+ "VI",
2459
+ "VIC",
2460
+ "VMEM",
2461
+ "VMID",
2462
+ "VPU",
2463
+ "VRC",
2464
+ "VUI",
2465
+ "WARB",
2466
+ "XIP",
2467
+ "bpp",
2468
+ "eMMC",
2469
+ "hfPLA",
2470
+ "iGPU",
2471
+ "ipc",
2472
+ "ipc_fg",
2473
+ "ipc_t",
2474
+ "sbPLA",
2475
+ "xBTV",
2476
+ "xps"
2477
+ ],
2478
+ "bos_token": "<|startoftext|>",
2479
+ "clean_up_tokenization_spaces": false,
2480
+ "eos_token": "<|return|>",
2481
+ "extra_special_tokens": {},
2482
+ "model_input_names": [
2483
+ "input_ids",
2484
+ "attention_mask"
2485
+ ],
2486
+ "model_max_length": 1000000000000000019884624838656,
2487
+ "pad_token": "<|endoftext|>",
2488
+ "tokenizer_class": "PreTrainedTokenizerFast"
2489
+ }
checkpoint-3284/trainer_state.json ADDED
@@ -0,0 +1,2986 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 2.0,
6
+ "eval_steps": 500,
7
+ "global_step": 3284,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.0060901339829476245,
14
+ "grad_norm": 23.5319766998291,
15
+ "learning_rate": 1.2162162162162164e-05,
16
+ "loss": 4.5905,
17
+ "mean_token_accuracy": 0.3401473943144083,
18
+ "num_tokens": 132681.0,
19
+ "step": 10
20
+ },
21
+ {
22
+ "epoch": 0.012180267965895249,
23
+ "grad_norm": 6.916630744934082,
24
+ "learning_rate": 2.5675675675675675e-05,
25
+ "loss": 3.957,
26
+ "mean_token_accuracy": 0.3799716055393219,
27
+ "num_tokens": 264238.0,
28
+ "step": 20
29
+ },
30
+ {
31
+ "epoch": 0.018270401948842874,
32
+ "grad_norm": 2.717982292175293,
33
+ "learning_rate": 3.918918918918919e-05,
34
+ "loss": 3.047,
35
+ "mean_token_accuracy": 0.46811963245272636,
36
+ "num_tokens": 401308.0,
37
+ "step": 30
38
+ },
39
+ {
40
+ "epoch": 0.024360535931790498,
41
+ "grad_norm": 2.407865524291992,
42
+ "learning_rate": 5.27027027027027e-05,
43
+ "loss": 2.5322,
44
+ "mean_token_accuracy": 0.5190828196704388,
45
+ "num_tokens": 532444.0,
46
+ "step": 40
47
+ },
48
+ {
49
+ "epoch": 0.030450669914738125,
50
+ "grad_norm": 1.018301248550415,
51
+ "learning_rate": 6.621621621621621e-05,
52
+ "loss": 2.1325,
53
+ "mean_token_accuracy": 0.5782605841755867,
54
+ "num_tokens": 660406.0,
55
+ "step": 50
56
+ },
57
+ {
58
+ "epoch": 0.03654080389768575,
59
+ "grad_norm": 0.7315741181373596,
60
+ "learning_rate": 7.972972972972974e-05,
61
+ "loss": 1.9044,
62
+ "mean_token_accuracy": 0.6264914631843567,
63
+ "num_tokens": 795304.0,
64
+ "step": 60
65
+ },
66
+ {
67
+ "epoch": 0.04263093788063337,
68
+ "grad_norm": 0.6652920246124268,
69
+ "learning_rate": 9.324324324324324e-05,
70
+ "loss": 1.633,
71
+ "mean_token_accuracy": 0.6683938711881637,
72
+ "num_tokens": 934543.0,
73
+ "step": 70
74
+ },
75
+ {
76
+ "epoch": 0.048721071863580996,
77
+ "grad_norm": 0.6119660139083862,
78
+ "learning_rate": 0.00010675675675675677,
79
+ "loss": 1.543,
80
+ "mean_token_accuracy": 0.6834091022610664,
81
+ "num_tokens": 1070669.0,
82
+ "step": 80
83
+ },
84
+ {
85
+ "epoch": 0.05481120584652863,
86
+ "grad_norm": 0.591424286365509,
87
+ "learning_rate": 0.00012027027027027027,
88
+ "loss": 1.4154,
89
+ "mean_token_accuracy": 0.6991497233510018,
90
+ "num_tokens": 1211114.0,
91
+ "step": 90
92
+ },
93
+ {
94
+ "epoch": 0.06090133982947625,
95
+ "grad_norm": 0.5663530230522156,
96
+ "learning_rate": 0.0001337837837837838,
97
+ "loss": 1.3176,
98
+ "mean_token_accuracy": 0.7089206710457802,
99
+ "num_tokens": 1349584.0,
100
+ "step": 100
101
+ },
102
+ {
103
+ "epoch": 0.06699147381242387,
104
+ "grad_norm": 0.5881878137588501,
105
+ "learning_rate": 0.0001472972972972973,
106
+ "loss": 1.2293,
107
+ "mean_token_accuracy": 0.7254403859376908,
108
+ "num_tokens": 1487515.0,
109
+ "step": 110
110
+ },
111
+ {
112
+ "epoch": 0.0730816077953715,
113
+ "grad_norm": 0.7664394974708557,
114
+ "learning_rate": 0.00016081081081081083,
115
+ "loss": 1.1814,
116
+ "mean_token_accuracy": 0.7306812778115273,
117
+ "num_tokens": 1618603.0,
118
+ "step": 120
119
+ },
120
+ {
121
+ "epoch": 0.07917174177831912,
122
+ "grad_norm": 0.6155670881271362,
123
+ "learning_rate": 0.00017432432432432432,
124
+ "loss": 1.1967,
125
+ "mean_token_accuracy": 0.7284250959753991,
126
+ "num_tokens": 1750466.0,
127
+ "step": 130
128
+ },
129
+ {
130
+ "epoch": 0.08526187576126674,
131
+ "grad_norm": 0.5296258330345154,
132
+ "learning_rate": 0.00018783783783783784,
133
+ "loss": 1.0955,
134
+ "mean_token_accuracy": 0.7472824215888977,
135
+ "num_tokens": 1887913.0,
136
+ "step": 140
137
+ },
138
+ {
139
+ "epoch": 0.09135200974421437,
140
+ "grad_norm": 0.5564976334571838,
141
+ "learning_rate": 0.00019999998054550544,
142
+ "loss": 1.118,
143
+ "mean_token_accuracy": 0.7397311359643937,
144
+ "num_tokens": 2018579.0,
145
+ "step": 150
146
+ },
147
+ {
148
+ "epoch": 0.09744214372716199,
149
+ "grad_norm": 0.5301142930984497,
150
+ "learning_rate": 0.00019999764601633156,
151
+ "loss": 1.045,
152
+ "mean_token_accuracy": 0.7519380420446395,
153
+ "num_tokens": 2158851.0,
154
+ "step": 160
155
+ },
156
+ {
157
+ "epoch": 0.10353227771010962,
158
+ "grad_norm": 0.5949111580848694,
159
+ "learning_rate": 0.00019999142070388495,
160
+ "loss": 1.0497,
161
+ "mean_token_accuracy": 0.7520910769701004,
162
+ "num_tokens": 2296715.0,
163
+ "step": 170
164
+ },
165
+ {
166
+ "epoch": 0.10962241169305725,
167
+ "grad_norm": 0.6169262528419495,
168
+ "learning_rate": 0.0001999813048772986,
169
+ "loss": 1.0821,
170
+ "mean_token_accuracy": 0.7406247839331627,
171
+ "num_tokens": 2424756.0,
172
+ "step": 180
173
+ },
174
+ {
175
+ "epoch": 0.11571254567600488,
176
+ "grad_norm": 0.58912593126297,
177
+ "learning_rate": 0.00019996729897390057,
178
+ "loss": 1.0286,
179
+ "mean_token_accuracy": 0.7527454376220704,
180
+ "num_tokens": 2559362.0,
181
+ "step": 190
182
+ },
183
+ {
184
+ "epoch": 0.1218026796589525,
185
+ "grad_norm": 0.5084304213523865,
186
+ "learning_rate": 0.00019994940359919483,
187
+ "loss": 0.992,
188
+ "mean_token_accuracy": 0.7640391126275062,
189
+ "num_tokens": 2700231.0,
190
+ "step": 200
191
+ },
192
+ {
193
+ "epoch": 0.1278928136419001,
194
+ "grad_norm": 0.5790796279907227,
195
+ "learning_rate": 0.00019992761952683516,
196
+ "loss": 1.0146,
197
+ "mean_token_accuracy": 0.7554366230964661,
198
+ "num_tokens": 2831324.0,
199
+ "step": 210
200
+ },
201
+ {
202
+ "epoch": 0.13398294762484775,
203
+ "grad_norm": 0.5852051377296448,
204
+ "learning_rate": 0.00019990194769859188,
205
+ "loss": 0.978,
206
+ "mean_token_accuracy": 0.7612502485513687,
207
+ "num_tokens": 2967346.0,
208
+ "step": 220
209
+ },
210
+ {
211
+ "epoch": 0.14007308160779536,
212
+ "grad_norm": 0.5102785229682922,
213
+ "learning_rate": 0.00019987238922431088,
214
+ "loss": 0.9616,
215
+ "mean_token_accuracy": 0.7677591517567635,
216
+ "num_tokens": 3110936.0,
217
+ "step": 230
218
+ },
219
+ {
220
+ "epoch": 0.146163215590743,
221
+ "grad_norm": 0.5472669005393982,
222
+ "learning_rate": 0.00019983894538186576,
223
+ "loss": 0.9535,
224
+ "mean_token_accuracy": 0.76737689524889,
225
+ "num_tokens": 3247496.0,
226
+ "step": 240
227
+ },
228
+ {
229
+ "epoch": 0.15225334957369063,
230
+ "grad_norm": 0.5611053109169006,
231
+ "learning_rate": 0.0001998016176171026,
232
+ "loss": 0.9577,
233
+ "mean_token_accuracy": 0.7626092001795769,
234
+ "num_tokens": 3384178.0,
235
+ "step": 250
236
+ },
237
+ {
238
+ "epoch": 0.15834348355663824,
239
+ "grad_norm": 0.54055255651474,
240
+ "learning_rate": 0.0001997604075437774,
241
+ "loss": 0.9907,
242
+ "mean_token_accuracy": 0.7575223430991173,
243
+ "num_tokens": 3517617.0,
244
+ "step": 260
245
+ },
246
+ {
247
+ "epoch": 0.16443361753958588,
248
+ "grad_norm": 0.558316707611084,
249
+ "learning_rate": 0.0001997153169434864,
250
+ "loss": 0.944,
251
+ "mean_token_accuracy": 0.7664194419980049,
252
+ "num_tokens": 3662878.0,
253
+ "step": 270
254
+ },
255
+ {
256
+ "epoch": 0.1705237515225335,
257
+ "grad_norm": 0.49766939878463745,
258
+ "learning_rate": 0.0001996663477655889,
259
+ "loss": 0.9106,
260
+ "mean_token_accuracy": 0.7760038167238236,
261
+ "num_tokens": 3807411.0,
262
+ "step": 280
263
+ },
264
+ {
265
+ "epoch": 0.17661388550548113,
266
+ "grad_norm": 0.4953667223453522,
267
+ "learning_rate": 0.0001996135021271232,
268
+ "loss": 0.9687,
269
+ "mean_token_accuracy": 0.7605679705739021,
270
+ "num_tokens": 3936840.0,
271
+ "step": 290
272
+ },
273
+ {
274
+ "epoch": 0.18270401948842874,
275
+ "grad_norm": 0.5447947978973389,
276
+ "learning_rate": 0.00019955678231271484,
277
+ "loss": 0.9625,
278
+ "mean_token_accuracy": 0.7603292793035508,
279
+ "num_tokens": 4067826.0,
280
+ "step": 300
281
+ },
282
+ {
283
+ "epoch": 0.18879415347137637,
284
+ "grad_norm": 0.4665842056274414,
285
+ "learning_rate": 0.00019949619077447807,
286
+ "loss": 0.9372,
287
+ "mean_token_accuracy": 0.7676101759076118,
288
+ "num_tokens": 4205887.0,
289
+ "step": 310
290
+ },
291
+ {
292
+ "epoch": 0.19488428745432398,
293
+ "grad_norm": 0.515690267086029,
294
+ "learning_rate": 0.00019943173013190965,
295
+ "loss": 0.923,
296
+ "mean_token_accuracy": 0.7708473294973374,
297
+ "num_tokens": 4342894.0,
298
+ "step": 320
299
+ },
300
+ {
301
+ "epoch": 0.20097442143727162,
302
+ "grad_norm": 0.5831382274627686,
303
+ "learning_rate": 0.00019936340317177565,
304
+ "loss": 0.9203,
305
+ "mean_token_accuracy": 0.7708552837371826,
306
+ "num_tokens": 4477651.0,
307
+ "step": 330
308
+ },
309
+ {
310
+ "epoch": 0.20706455542021923,
311
+ "grad_norm": 0.6162773966789246,
312
+ "learning_rate": 0.0001992912128479911,
313
+ "loss": 0.916,
314
+ "mean_token_accuracy": 0.7702088996767997,
315
+ "num_tokens": 4610746.0,
316
+ "step": 340
317
+ },
318
+ {
319
+ "epoch": 0.21315468940316687,
320
+ "grad_norm": 0.5172462463378906,
321
+ "learning_rate": 0.00019921516228149207,
322
+ "loss": 0.8942,
323
+ "mean_token_accuracy": 0.7741821393370628,
324
+ "num_tokens": 4751175.0,
325
+ "step": 350
326
+ },
327
+ {
328
+ "epoch": 0.2192448233861145,
329
+ "grad_norm": 0.5890468955039978,
330
+ "learning_rate": 0.0001991352547601009,
331
+ "loss": 0.9229,
332
+ "mean_token_accuracy": 0.7691043332219124,
333
+ "num_tokens": 4882328.0,
334
+ "step": 360
335
+ },
336
+ {
337
+ "epoch": 0.22533495736906212,
338
+ "grad_norm": 0.5522404909133911,
339
+ "learning_rate": 0.00019905149373838408,
340
+ "loss": 0.9294,
341
+ "mean_token_accuracy": 0.7646071568131447,
342
+ "num_tokens": 5012181.0,
343
+ "step": 370
344
+ },
345
+ {
346
+ "epoch": 0.23142509135200975,
347
+ "grad_norm": 0.5349445939064026,
348
+ "learning_rate": 0.0001989638828375028,
349
+ "loss": 0.8797,
350
+ "mean_token_accuracy": 0.7771721839904785,
351
+ "num_tokens": 5151133.0,
352
+ "step": 380
353
+ },
354
+ {
355
+ "epoch": 0.23751522533495736,
356
+ "grad_norm": 0.531052827835083,
357
+ "learning_rate": 0.00019887242584505635,
358
+ "loss": 0.9221,
359
+ "mean_token_accuracy": 0.7678465083241462,
360
+ "num_tokens": 5279790.0,
361
+ "step": 390
362
+ },
363
+ {
364
+ "epoch": 0.243605359317905,
365
+ "grad_norm": 0.5126324892044067,
366
+ "learning_rate": 0.00019877712671491864,
367
+ "loss": 0.8862,
368
+ "mean_token_accuracy": 0.7739894777536392,
369
+ "num_tokens": 5412390.0,
370
+ "step": 400
371
+ },
372
+ {
373
+ "epoch": 0.2496954933008526,
374
+ "grad_norm": 0.5111438632011414,
375
+ "learning_rate": 0.00019867798956706693,
376
+ "loss": 0.9005,
377
+ "mean_token_accuracy": 0.7721902653574944,
378
+ "num_tokens": 5545801.0,
379
+ "step": 410
380
+ },
381
+ {
382
+ "epoch": 0.2557856272838002,
383
+ "grad_norm": 0.5488138794898987,
384
+ "learning_rate": 0.00019857501868740402,
385
+ "loss": 0.8988,
386
+ "mean_token_accuracy": 0.7690282896161079,
387
+ "num_tokens": 5673758.0,
388
+ "step": 420
389
+ },
390
+ {
391
+ "epoch": 0.2618757612667479,
392
+ "grad_norm": 0.5497994422912598,
393
+ "learning_rate": 0.0001984682185275727,
394
+ "loss": 0.8802,
395
+ "mean_token_accuracy": 0.7780183687806129,
396
+ "num_tokens": 5813158.0,
397
+ "step": 430
398
+ },
399
+ {
400
+ "epoch": 0.2679658952496955,
401
+ "grad_norm": 0.5478431582450867,
402
+ "learning_rate": 0.0001983575937047635,
403
+ "loss": 0.865,
404
+ "mean_token_accuracy": 0.7785944610834121,
405
+ "num_tokens": 5947367.0,
406
+ "step": 440
407
+ },
408
+ {
409
+ "epoch": 0.2740560292326431,
410
+ "grad_norm": 0.5188766717910767,
411
+ "learning_rate": 0.00019824314900151487,
412
+ "loss": 0.8798,
413
+ "mean_token_accuracy": 0.7752803862094879,
414
+ "num_tokens": 6081060.0,
415
+ "step": 450
416
+ },
417
+ {
418
+ "epoch": 0.2801461632155907,
419
+ "grad_norm": 0.530222475528717,
420
+ "learning_rate": 0.00019812488936550666,
421
+ "loss": 0.8628,
422
+ "mean_token_accuracy": 0.7801630645990372,
423
+ "num_tokens": 6217834.0,
424
+ "step": 460
425
+ },
426
+ {
427
+ "epoch": 0.2862362971985384,
428
+ "grad_norm": 0.5987964868545532,
429
+ "learning_rate": 0.00019800281990934614,
430
+ "loss": 0.8775,
431
+ "mean_token_accuracy": 0.7760324433445931,
432
+ "num_tokens": 6350451.0,
433
+ "step": 470
434
+ },
435
+ {
436
+ "epoch": 0.292326431181486,
437
+ "grad_norm": 0.5468559265136719,
438
+ "learning_rate": 0.0001978769459103468,
439
+ "loss": 0.8721,
440
+ "mean_token_accuracy": 0.7794204503297806,
441
+ "num_tokens": 6484738.0,
442
+ "step": 480
443
+ },
444
+ {
445
+ "epoch": 0.2984165651644336,
446
+ "grad_norm": 0.5541098117828369,
447
+ "learning_rate": 0.0001977472728103005,
448
+ "loss": 0.8785,
449
+ "mean_token_accuracy": 0.7767582029104233,
450
+ "num_tokens": 6619313.0,
451
+ "step": 490
452
+ },
453
+ {
454
+ "epoch": 0.30450669914738127,
455
+ "grad_norm": 0.5134281516075134,
456
+ "learning_rate": 0.0001976138062152419,
457
+ "loss": 0.8717,
458
+ "mean_token_accuracy": 0.7752724394202233,
459
+ "num_tokens": 6753195.0,
460
+ "step": 500
461
+ },
462
+ {
463
+ "epoch": 0.3105968331303289,
464
+ "grad_norm": 0.49164435267448425,
465
+ "learning_rate": 0.00019747655189520633,
466
+ "loss": 0.8757,
467
+ "mean_token_accuracy": 0.7768464118242264,
468
+ "num_tokens": 6890448.0,
469
+ "step": 510
470
+ },
471
+ {
472
+ "epoch": 0.3166869671132765,
473
+ "grad_norm": 0.5899345278739929,
474
+ "learning_rate": 0.00019733551578398023,
475
+ "loss": 0.8322,
476
+ "mean_token_accuracy": 0.7859320402145386,
477
+ "num_tokens": 7027488.0,
478
+ "step": 520
479
+ },
480
+ {
481
+ "epoch": 0.3227771010962241,
482
+ "grad_norm": 0.6552841663360596,
483
+ "learning_rate": 0.0001971907039788447,
484
+ "loss": 0.861,
485
+ "mean_token_accuracy": 0.7770532324910164,
486
+ "num_tokens": 7161184.0,
487
+ "step": 530
488
+ },
489
+ {
490
+ "epoch": 0.32886723507917176,
491
+ "grad_norm": 0.5038822889328003,
492
+ "learning_rate": 0.0001970421227403117,
493
+ "loss": 0.8825,
494
+ "mean_token_accuracy": 0.775890800356865,
495
+ "num_tokens": 7294399.0,
496
+ "step": 540
497
+ },
498
+ {
499
+ "epoch": 0.33495736906211937,
500
+ "grad_norm": 0.5094267129898071,
501
+ "learning_rate": 0.00019688977849185378,
502
+ "loss": 0.8598,
503
+ "mean_token_accuracy": 0.7817838475108146,
504
+ "num_tokens": 7427183.0,
505
+ "step": 550
506
+ },
507
+ {
508
+ "epoch": 0.341047503045067,
509
+ "grad_norm": 0.5282809138298035,
510
+ "learning_rate": 0.00019673367781962594,
511
+ "loss": 0.8463,
512
+ "mean_token_accuracy": 0.7812959104776382,
513
+ "num_tokens": 7561734.0,
514
+ "step": 560
515
+ },
516
+ {
517
+ "epoch": 0.3471376370280146,
518
+ "grad_norm": 0.45355409383773804,
519
+ "learning_rate": 0.00019657382747218123,
520
+ "loss": 0.8207,
521
+ "mean_token_accuracy": 0.7888262197375298,
522
+ "num_tokens": 7706228.0,
523
+ "step": 570
524
+ },
525
+ {
526
+ "epoch": 0.35322777101096225,
527
+ "grad_norm": 0.5162333846092224,
528
+ "learning_rate": 0.00019641023436017883,
529
+ "loss": 0.8235,
530
+ "mean_token_accuracy": 0.7868947923183441,
531
+ "num_tokens": 7846684.0,
532
+ "step": 580
533
+ },
534
+ {
535
+ "epoch": 0.35931790499390986,
536
+ "grad_norm": 0.5194632411003113,
537
+ "learning_rate": 0.00019624290555608526,
538
+ "loss": 0.8129,
539
+ "mean_token_accuracy": 0.7884069249033928,
540
+ "num_tokens": 7986811.0,
541
+ "step": 590
542
+ },
543
+ {
544
+ "epoch": 0.3654080389768575,
545
+ "grad_norm": 0.5494846701622009,
546
+ "learning_rate": 0.00019607184829386882,
547
+ "loss": 0.8084,
548
+ "mean_token_accuracy": 0.7874000474810601,
549
+ "num_tokens": 8124538.0,
550
+ "step": 600
551
+ },
552
+ {
553
+ "epoch": 0.37149817295980514,
554
+ "grad_norm": 0.5368776917457581,
555
+ "learning_rate": 0.0001958970699686866,
556
+ "loss": 0.8225,
557
+ "mean_token_accuracy": 0.783010233938694,
558
+ "num_tokens": 8260529.0,
559
+ "step": 610
560
+ },
561
+ {
562
+ "epoch": 0.37758830694275275,
563
+ "grad_norm": 0.6229024529457092,
564
+ "learning_rate": 0.00019571857813656496,
565
+ "loss": 0.8786,
566
+ "mean_token_accuracy": 0.7753148928284646,
567
+ "num_tokens": 8389042.0,
568
+ "step": 620
569
+ },
570
+ {
571
+ "epoch": 0.38367844092570036,
572
+ "grad_norm": 0.5601000785827637,
573
+ "learning_rate": 0.00019553638051407279,
574
+ "loss": 0.8909,
575
+ "mean_token_accuracy": 0.7745720192790031,
576
+ "num_tokens": 8513603.0,
577
+ "step": 630
578
+ },
579
+ {
580
+ "epoch": 0.38976857490864797,
581
+ "grad_norm": 0.438970685005188,
582
+ "learning_rate": 0.0001953504849779879,
583
+ "loss": 0.8085,
584
+ "mean_token_accuracy": 0.7871840804815292,
585
+ "num_tokens": 8652970.0,
586
+ "step": 640
587
+ },
588
+ {
589
+ "epoch": 0.39585870889159563,
590
+ "grad_norm": 0.5505132079124451,
591
+ "learning_rate": 0.00019516089956495648,
592
+ "loss": 0.8102,
593
+ "mean_token_accuracy": 0.7869585514068603,
594
+ "num_tokens": 8792103.0,
595
+ "step": 650
596
+ },
597
+ {
598
+ "epoch": 0.40194884287454324,
599
+ "grad_norm": 0.5447221398353577,
600
+ "learning_rate": 0.00019496763247114581,
601
+ "loss": 0.8336,
602
+ "mean_token_accuracy": 0.7816034242510795,
603
+ "num_tokens": 8926853.0,
604
+ "step": 660
605
+ },
606
+ {
607
+ "epoch": 0.40803897685749085,
608
+ "grad_norm": 0.4652746915817261,
609
+ "learning_rate": 0.00019477069205188965,
610
+ "loss": 0.8383,
611
+ "mean_token_accuracy": 0.7826304718852043,
612
+ "num_tokens": 9059592.0,
613
+ "step": 670
614
+ },
615
+ {
616
+ "epoch": 0.41412911084043846,
617
+ "grad_norm": 0.42363590002059937,
618
+ "learning_rate": 0.00019457008682132726,
619
+ "loss": 0.847,
620
+ "mean_token_accuracy": 0.7810002073645592,
621
+ "num_tokens": 9193062.0,
622
+ "step": 680
623
+ },
624
+ {
625
+ "epoch": 0.42021924482338613,
626
+ "grad_norm": 0.5209478735923767,
627
+ "learning_rate": 0.00019436582545203518,
628
+ "loss": 0.8766,
629
+ "mean_token_accuracy": 0.7733785718679428,
630
+ "num_tokens": 9315805.0,
631
+ "step": 690
632
+ },
633
+ {
634
+ "epoch": 0.42630937880633374,
635
+ "grad_norm": 0.5176642537117004,
636
+ "learning_rate": 0.00019415791677465237,
637
+ "loss": 0.8155,
638
+ "mean_token_accuracy": 0.7869213685393334,
639
+ "num_tokens": 9448863.0,
640
+ "step": 700
641
+ },
642
+ {
643
+ "epoch": 0.43239951278928135,
644
+ "grad_norm": 0.4531058371067047,
645
+ "learning_rate": 0.00019394636977749843,
646
+ "loss": 0.8096,
647
+ "mean_token_accuracy": 0.7903949975967407,
648
+ "num_tokens": 9589382.0,
649
+ "step": 710
650
+ },
651
+ {
652
+ "epoch": 0.438489646772229,
653
+ "grad_norm": 0.5651549100875854,
654
+ "learning_rate": 0.000193731193606185,
655
+ "loss": 0.8263,
656
+ "mean_token_accuracy": 0.7823062822222709,
657
+ "num_tokens": 9723562.0,
658
+ "step": 720
659
+ },
660
+ {
661
+ "epoch": 0.4445797807551766,
662
+ "grad_norm": 0.5377989411354065,
663
+ "learning_rate": 0.00019351239756322031,
664
+ "loss": 0.7993,
665
+ "mean_token_accuracy": 0.7908329650759697,
666
+ "num_tokens": 9859255.0,
667
+ "step": 730
668
+ },
669
+ {
670
+ "epoch": 0.45066991473812423,
671
+ "grad_norm": 0.5420868396759033,
672
+ "learning_rate": 0.00019328999110760722,
673
+ "loss": 0.8461,
674
+ "mean_token_accuracy": 0.7780480548739434,
675
+ "num_tokens": 9981578.0,
676
+ "step": 740
677
+ },
678
+ {
679
+ "epoch": 0.45676004872107184,
680
+ "grad_norm": 0.4889216125011444,
681
+ "learning_rate": 0.000193063983854434,
682
+ "loss": 0.7652,
683
+ "mean_token_accuracy": 0.7959530428051949,
684
+ "num_tokens": 10122922.0,
685
+ "step": 750
686
+ },
687
+ {
688
+ "epoch": 0.4628501827040195,
689
+ "grad_norm": 0.5044087767601013,
690
+ "learning_rate": 0.00019283438557445893,
691
+ "loss": 0.824,
692
+ "mean_token_accuracy": 0.7845935523509979,
693
+ "num_tokens": 10252854.0,
694
+ "step": 760
695
+ },
696
+ {
697
+ "epoch": 0.4689403166869671,
698
+ "grad_norm": 0.5286466479301453,
699
+ "learning_rate": 0.00019260120619368773,
700
+ "loss": 0.815,
701
+ "mean_token_accuracy": 0.7850656941533088,
702
+ "num_tokens": 10385075.0,
703
+ "step": 770
704
+ },
705
+ {
706
+ "epoch": 0.47503045066991473,
707
+ "grad_norm": 0.5441628694534302,
708
+ "learning_rate": 0.00019236445579294437,
709
+ "loss": 0.8048,
710
+ "mean_token_accuracy": 0.7876680314540863,
711
+ "num_tokens": 10520011.0,
712
+ "step": 780
713
+ },
714
+ {
715
+ "epoch": 0.48112058465286234,
716
+ "grad_norm": 0.49002447724342346,
717
+ "learning_rate": 0.0001921241446074355,
718
+ "loss": 0.8059,
719
+ "mean_token_accuracy": 0.7898563235998154,
720
+ "num_tokens": 10652488.0,
721
+ "step": 790
722
+ },
723
+ {
724
+ "epoch": 0.48721071863581,
725
+ "grad_norm": 0.4479144811630249,
726
+ "learning_rate": 0.0001918802830263077,
727
+ "loss": 0.7913,
728
+ "mean_token_accuracy": 0.7928732186555862,
729
+ "num_tokens": 10785974.0,
730
+ "step": 800
731
+ },
732
+ {
733
+ "epoch": 0.4933008526187576,
734
+ "grad_norm": 0.5007497668266296,
735
+ "learning_rate": 0.00019163288159219853,
736
+ "loss": 0.8083,
737
+ "mean_token_accuracy": 0.7893043681979179,
738
+ "num_tokens": 10920950.0,
739
+ "step": 810
740
+ },
741
+ {
742
+ "epoch": 0.4993909866017052,
743
+ "grad_norm": 0.5289483070373535,
744
+ "learning_rate": 0.00019138195100078064,
745
+ "loss": 0.8033,
746
+ "mean_token_accuracy": 0.7864485770463944,
747
+ "num_tokens": 11056380.0,
748
+ "step": 820
749
+ },
750
+ {
751
+ "epoch": 0.5054811205846529,
752
+ "grad_norm": 0.5604159832000732,
753
+ "learning_rate": 0.0001911275021002994,
754
+ "loss": 0.7652,
755
+ "mean_token_accuracy": 0.7946401730179786,
756
+ "num_tokens": 11196074.0,
757
+ "step": 830
758
+ },
759
+ {
760
+ "epoch": 0.5115712545676004,
761
+ "grad_norm": 0.43645399808883667,
762
+ "learning_rate": 0.00019086954589110397,
763
+ "loss": 0.7724,
764
+ "mean_token_accuracy": 0.7990294560790062,
765
+ "num_tokens": 11337990.0,
766
+ "step": 840
767
+ },
768
+ {
769
+ "epoch": 0.5176613885505481,
770
+ "grad_norm": 0.43992146849632263,
771
+ "learning_rate": 0.0001906080935251716,
772
+ "loss": 0.7612,
773
+ "mean_token_accuracy": 0.7999786615371705,
774
+ "num_tokens": 11481565.0,
775
+ "step": 850
776
+ },
777
+ {
778
+ "epoch": 0.5237515225334958,
779
+ "grad_norm": 0.5595120191574097,
780
+ "learning_rate": 0.0001903431563056256,
781
+ "loss": 0.8266,
782
+ "mean_token_accuracy": 0.7859750911593437,
783
+ "num_tokens": 11611714.0,
784
+ "step": 860
785
+ },
786
+ {
787
+ "epoch": 0.5298416565164433,
788
+ "grad_norm": 0.5001987218856812,
789
+ "learning_rate": 0.0001900747456862467,
790
+ "loss": 0.8506,
791
+ "mean_token_accuracy": 0.779585388302803,
792
+ "num_tokens": 11736573.0,
793
+ "step": 870
794
+ },
795
+ {
796
+ "epoch": 0.535931790499391,
797
+ "grad_norm": 0.430147647857666,
798
+ "learning_rate": 0.00018980287327097784,
799
+ "loss": 0.7707,
800
+ "mean_token_accuracy": 0.795211361348629,
801
+ "num_tokens": 11876859.0,
802
+ "step": 880
803
+ },
804
+ {
805
+ "epoch": 0.5420219244823387,
806
+ "grad_norm": 0.5346289873123169,
807
+ "learning_rate": 0.00018952755081342245,
808
+ "loss": 0.8057,
809
+ "mean_token_accuracy": 0.7871127843856811,
810
+ "num_tokens": 12007654.0,
811
+ "step": 890
812
+ },
813
+ {
814
+ "epoch": 0.5481120584652862,
815
+ "grad_norm": 0.46072253584861755,
816
+ "learning_rate": 0.00018924879021633653,
817
+ "loss": 0.7924,
818
+ "mean_token_accuracy": 0.7913773030042648,
819
+ "num_tokens": 12140520.0,
820
+ "step": 900
821
+ },
822
+ {
823
+ "epoch": 0.5542021924482339,
824
+ "grad_norm": 0.4803653955459595,
825
+ "learning_rate": 0.00018896660353111375,
826
+ "loss": 0.8398,
827
+ "mean_token_accuracy": 0.7807079553604126,
828
+ "num_tokens": 12267219.0,
829
+ "step": 910
830
+ },
831
+ {
832
+ "epoch": 0.5602923264311814,
833
+ "grad_norm": 0.5219636559486389,
834
+ "learning_rate": 0.0001886810029572647,
835
+ "loss": 0.7612,
836
+ "mean_token_accuracy": 0.7993015512824059,
837
+ "num_tokens": 12404646.0,
838
+ "step": 920
839
+ },
840
+ {
841
+ "epoch": 0.5663824604141291,
842
+ "grad_norm": 0.501483142375946,
843
+ "learning_rate": 0.00018839200084188936,
844
+ "loss": 0.7953,
845
+ "mean_token_accuracy": 0.787814213335514,
846
+ "num_tokens": 12538219.0,
847
+ "step": 930
848
+ },
849
+ {
850
+ "epoch": 0.5724725943970768,
851
+ "grad_norm": 0.47334522008895874,
852
+ "learning_rate": 0.00018809960967914346,
853
+ "loss": 0.789,
854
+ "mean_token_accuracy": 0.7928574904799461,
855
+ "num_tokens": 12673805.0,
856
+ "step": 940
857
+ },
858
+ {
859
+ "epoch": 0.5785627283800243,
860
+ "grad_norm": 0.5057492852210999,
861
+ "learning_rate": 0.00018780384210969806,
862
+ "loss": 0.7746,
863
+ "mean_token_accuracy": 0.7947553545236588,
864
+ "num_tokens": 12811727.0,
865
+ "step": 950
866
+ },
867
+ {
868
+ "epoch": 0.584652862362972,
869
+ "grad_norm": 0.5179910659790039,
870
+ "learning_rate": 0.00018750471092019325,
871
+ "loss": 0.7962,
872
+ "mean_token_accuracy": 0.7905686929821968,
873
+ "num_tokens": 12947641.0,
874
+ "step": 960
875
+ },
876
+ {
877
+ "epoch": 0.5907429963459196,
878
+ "grad_norm": 0.45797088742256165,
879
+ "learning_rate": 0.00018720222904268543,
880
+ "loss": 0.7678,
881
+ "mean_token_accuracy": 0.7969774708151818,
882
+ "num_tokens": 13083869.0,
883
+ "step": 970
884
+ },
885
+ {
886
+ "epoch": 0.5968331303288672,
887
+ "grad_norm": 0.48360612988471985,
888
+ "learning_rate": 0.00018689640955408803,
889
+ "loss": 0.7996,
890
+ "mean_token_accuracy": 0.7885591968894005,
891
+ "num_tokens": 13211807.0,
892
+ "step": 980
893
+ },
894
+ {
895
+ "epoch": 0.6029232643118149,
896
+ "grad_norm": 0.4378497004508972,
897
+ "learning_rate": 0.00018658726567560635,
898
+ "loss": 0.7652,
899
+ "mean_token_accuracy": 0.7969291344285011,
900
+ "num_tokens": 13351856.0,
901
+ "step": 990
902
+ },
903
+ {
904
+ "epoch": 0.6090133982947625,
905
+ "grad_norm": 0.4857536852359772,
906
+ "learning_rate": 0.00018627481077216577,
907
+ "loss": 0.7786,
908
+ "mean_token_accuracy": 0.7914443418383599,
909
+ "num_tokens": 13486443.0,
910
+ "step": 1000
911
+ },
912
+ {
913
+ "epoch": 0.6151035322777101,
914
+ "grad_norm": 0.5233064293861389,
915
+ "learning_rate": 0.0001859590583518343,
916
+ "loss": 0.8241,
917
+ "mean_token_accuracy": 0.7811850637197495,
918
+ "num_tokens": 13612035.0,
919
+ "step": 1010
920
+ },
921
+ {
922
+ "epoch": 0.6211936662606578,
923
+ "grad_norm": 0.5328738689422607,
924
+ "learning_rate": 0.00018564002206523816,
925
+ "loss": 0.7502,
926
+ "mean_token_accuracy": 0.7993430674076081,
927
+ "num_tokens": 13756509.0,
928
+ "step": 1020
929
+ },
930
+ {
931
+ "epoch": 0.6272838002436053,
932
+ "grad_norm": 0.47962310910224915,
933
+ "learning_rate": 0.000185317715704972,
934
+ "loss": 0.7984,
935
+ "mean_token_accuracy": 0.7864531084895134,
936
+ "num_tokens": 13883033.0,
937
+ "step": 1030
938
+ },
939
+ {
940
+ "epoch": 0.633373934226553,
941
+ "grad_norm": 0.5685893893241882,
942
+ "learning_rate": 0.0001849921532050024,
943
+ "loss": 0.7869,
944
+ "mean_token_accuracy": 0.7909937381744385,
945
+ "num_tokens": 14015234.0,
946
+ "step": 1040
947
+ },
948
+ {
949
+ "epoch": 0.6394640682095006,
950
+ "grad_norm": 0.49146631360054016,
951
+ "learning_rate": 0.00018466334864006566,
952
+ "loss": 0.7952,
953
+ "mean_token_accuracy": 0.7878949210047722,
954
+ "num_tokens": 14149319.0,
955
+ "step": 1050
956
+ },
957
+ {
958
+ "epoch": 0.6455542021924482,
959
+ "grad_norm": 0.5556225776672363,
960
+ "learning_rate": 0.0001843313162250591,
961
+ "loss": 0.7524,
962
+ "mean_token_accuracy": 0.7994373366236687,
963
+ "num_tokens": 14286868.0,
964
+ "step": 1060
965
+ },
966
+ {
967
+ "epoch": 0.6516443361753959,
968
+ "grad_norm": 0.511379063129425,
969
+ "learning_rate": 0.00018399607031442666,
970
+ "loss": 0.7929,
971
+ "mean_token_accuracy": 0.7921562284231186,
972
+ "num_tokens": 14418354.0,
973
+ "step": 1070
974
+ },
975
+ {
976
+ "epoch": 0.6577344701583435,
977
+ "grad_norm": 0.5019840598106384,
978
+ "learning_rate": 0.00018365762540153836,
979
+ "loss": 0.758,
980
+ "mean_token_accuracy": 0.7989353060722351,
981
+ "num_tokens": 14553174.0,
982
+ "step": 1080
983
+ },
984
+ {
985
+ "epoch": 0.6638246041412911,
986
+ "grad_norm": 0.6032467484474182,
987
+ "learning_rate": 0.00018331599611806366,
988
+ "loss": 0.7888,
989
+ "mean_token_accuracy": 0.7903819754719734,
990
+ "num_tokens": 14681393.0,
991
+ "step": 1090
992
+ },
993
+ {
994
+ "epoch": 0.6699147381242387,
995
+ "grad_norm": 0.5369830131530762,
996
+ "learning_rate": 0.00018297119723333877,
997
+ "loss": 0.765,
998
+ "mean_token_accuracy": 0.7950262635946274,
999
+ "num_tokens": 14814565.0,
1000
+ "step": 1100
1001
+ },
1002
+ {
1003
+ "epoch": 0.6760048721071864,
1004
+ "grad_norm": 0.5289803743362427,
1005
+ "learning_rate": 0.00018262324365372846,
1006
+ "loss": 0.7496,
1007
+ "mean_token_accuracy": 0.8032818242907525,
1008
+ "num_tokens": 14954351.0,
1009
+ "step": 1110
1010
+ },
1011
+ {
1012
+ "epoch": 0.682095006090134,
1013
+ "grad_norm": 0.5440439581871033,
1014
+ "learning_rate": 0.0001822721504219814,
1015
+ "loss": 0.7432,
1016
+ "mean_token_accuracy": 0.799126236140728,
1017
+ "num_tokens": 15094879.0,
1018
+ "step": 1120
1019
+ },
1020
+ {
1021
+ "epoch": 0.6881851400730816,
1022
+ "grad_norm": 0.46225935220718384,
1023
+ "learning_rate": 0.00018191793271657978,
1024
+ "loss": 0.7513,
1025
+ "mean_token_accuracy": 0.8022688791155815,
1026
+ "num_tokens": 15234906.0,
1027
+ "step": 1130
1028
+ },
1029
+ {
1030
+ "epoch": 0.6942752740560292,
1031
+ "grad_norm": 0.5592020750045776,
1032
+ "learning_rate": 0.0001815606058510833,
1033
+ "loss": 0.7583,
1034
+ "mean_token_accuracy": 0.7984497547149658,
1035
+ "num_tokens": 15373526.0,
1036
+ "step": 1140
1037
+ },
1038
+ {
1039
+ "epoch": 0.7003654080389768,
1040
+ "grad_norm": 0.525090217590332,
1041
+ "learning_rate": 0.00018120018527346702,
1042
+ "loss": 0.7254,
1043
+ "mean_token_accuracy": 0.8070619881153107,
1044
+ "num_tokens": 15516264.0,
1045
+ "step": 1150
1046
+ },
1047
+ {
1048
+ "epoch": 0.7064555420219245,
1049
+ "grad_norm": 0.5380759239196777,
1050
+ "learning_rate": 0.00018083668656545355,
1051
+ "loss": 0.8041,
1052
+ "mean_token_accuracy": 0.7866759791970253,
1053
+ "num_tokens": 15640444.0,
1054
+ "step": 1160
1055
+ },
1056
+ {
1057
+ "epoch": 0.7125456760048721,
1058
+ "grad_norm": 0.47815701365470886,
1059
+ "learning_rate": 0.00018047012544183938,
1060
+ "loss": 0.7604,
1061
+ "mean_token_accuracy": 0.796156468987465,
1062
+ "num_tokens": 15778070.0,
1063
+ "step": 1170
1064
+ },
1065
+ {
1066
+ "epoch": 0.7186358099878197,
1067
+ "grad_norm": 0.5380450487136841,
1068
+ "learning_rate": 0.00018010051774981553,
1069
+ "loss": 0.8135,
1070
+ "mean_token_accuracy": 0.7842124432325364,
1071
+ "num_tokens": 15899739.0,
1072
+ "step": 1180
1073
+ },
1074
+ {
1075
+ "epoch": 0.7247259439707674,
1076
+ "grad_norm": 0.5047502517700195,
1077
+ "learning_rate": 0.00017972787946828246,
1078
+ "loss": 0.7642,
1079
+ "mean_token_accuracy": 0.7989341139793396,
1080
+ "num_tokens": 16035805.0,
1081
+ "step": 1190
1082
+ },
1083
+ {
1084
+ "epoch": 0.730816077953715,
1085
+ "grad_norm": 0.5440967679023743,
1086
+ "learning_rate": 0.00017935222670715918,
1087
+ "loss": 0.735,
1088
+ "mean_token_accuracy": 0.8048294603824615,
1089
+ "num_tokens": 16172541.0,
1090
+ "step": 1200
1091
+ },
1092
+ {
1093
+ "epoch": 0.7369062119366626,
1094
+ "grad_norm": 0.4766077399253845,
1095
+ "learning_rate": 0.000178973575706687,
1096
+ "loss": 0.805,
1097
+ "mean_token_accuracy": 0.7871790423989296,
1098
+ "num_tokens": 16296988.0,
1099
+ "step": 1210
1100
+ },
1101
+ {
1102
+ "epoch": 0.7429963459196103,
1103
+ "grad_norm": 0.4153214991092682,
1104
+ "learning_rate": 0.00017859194283672704,
1105
+ "loss": 0.7635,
1106
+ "mean_token_accuracy": 0.7964595645666123,
1107
+ "num_tokens": 16432022.0,
1108
+ "step": 1220
1109
+ },
1110
+ {
1111
+ "epoch": 0.7490864799025578,
1112
+ "grad_norm": 0.4698518216609955,
1113
+ "learning_rate": 0.00017820734459605302,
1114
+ "loss": 0.7397,
1115
+ "mean_token_accuracy": 0.8046972885727882,
1116
+ "num_tokens": 16572880.0,
1117
+ "step": 1230
1118
+ },
1119
+ {
1120
+ "epoch": 0.7551766138855055,
1121
+ "grad_norm": 0.46101540327072144,
1122
+ "learning_rate": 0.00017781979761163756,
1123
+ "loss": 0.7174,
1124
+ "mean_token_accuracy": 0.8066875368356705,
1125
+ "num_tokens": 16714419.0,
1126
+ "step": 1240
1127
+ },
1128
+ {
1129
+ "epoch": 0.761266747868453,
1130
+ "grad_norm": 0.5313341021537781,
1131
+ "learning_rate": 0.00017742931863793358,
1132
+ "loss": 0.7797,
1133
+ "mean_token_accuracy": 0.7911526098847389,
1134
+ "num_tokens": 16838285.0,
1135
+ "step": 1250
1136
+ },
1137
+ {
1138
+ "epoch": 0.7673568818514007,
1139
+ "grad_norm": 0.4627362787723541,
1140
+ "learning_rate": 0.00017703592455614998,
1141
+ "loss": 0.7626,
1142
+ "mean_token_accuracy": 0.7970306649804115,
1143
+ "num_tokens": 16976065.0,
1144
+ "step": 1260
1145
+ },
1146
+ {
1147
+ "epoch": 0.7734470158343484,
1148
+ "grad_norm": 0.5429073572158813,
1149
+ "learning_rate": 0.00017663963237352177,
1150
+ "loss": 0.7398,
1151
+ "mean_token_accuracy": 0.8005403786897659,
1152
+ "num_tokens": 17112901.0,
1153
+ "step": 1270
1154
+ },
1155
+ {
1156
+ "epoch": 0.7795371498172959,
1157
+ "grad_norm": 0.6781270503997803,
1158
+ "learning_rate": 0.00017624045922257471,
1159
+ "loss": 0.7607,
1160
+ "mean_token_accuracy": 0.7946217939257622,
1161
+ "num_tokens": 17245480.0,
1162
+ "step": 1280
1163
+ },
1164
+ {
1165
+ "epoch": 0.7856272838002436,
1166
+ "grad_norm": 0.5227305293083191,
1167
+ "learning_rate": 0.00017583842236038483,
1168
+ "loss": 0.7217,
1169
+ "mean_token_accuracy": 0.8064659267663956,
1170
+ "num_tokens": 17387171.0,
1171
+ "step": 1290
1172
+ },
1173
+ {
1174
+ "epoch": 0.7917174177831913,
1175
+ "grad_norm": 0.49253156781196594,
1176
+ "learning_rate": 0.0001754335391678323,
1177
+ "loss": 0.7652,
1178
+ "mean_token_accuracy": 0.7960015773773194,
1179
+ "num_tokens": 17521164.0,
1180
+ "step": 1300
1181
+ },
1182
+ {
1183
+ "epoch": 0.7978075517661388,
1184
+ "grad_norm": 0.5103631615638733,
1185
+ "learning_rate": 0.00017502582714884997,
1186
+ "loss": 0.7435,
1187
+ "mean_token_accuracy": 0.7995276898145676,
1188
+ "num_tokens": 17657818.0,
1189
+ "step": 1310
1190
+ },
1191
+ {
1192
+ "epoch": 0.8038976857490865,
1193
+ "grad_norm": 0.5531247854232788,
1194
+ "learning_rate": 0.00017461530392966665,
1195
+ "loss": 0.7986,
1196
+ "mean_token_accuracy": 0.7892467245459557,
1197
+ "num_tokens": 17784361.0,
1198
+ "step": 1320
1199
+ },
1200
+ {
1201
+ "epoch": 0.8099878197320342,
1202
+ "grad_norm": 0.4574586749076843,
1203
+ "learning_rate": 0.00017420198725804517,
1204
+ "loss": 0.6889,
1205
+ "mean_token_accuracy": 0.8135112956166267,
1206
+ "num_tokens": 17929664.0,
1207
+ "step": 1330
1208
+ },
1209
+ {
1210
+ "epoch": 0.8160779537149817,
1211
+ "grad_norm": 0.4734383225440979,
1212
+ "learning_rate": 0.00017378589500251498,
1213
+ "loss": 0.7308,
1214
+ "mean_token_accuracy": 0.8029947131872177,
1215
+ "num_tokens": 18071182.0,
1216
+ "step": 1340
1217
+ },
1218
+ {
1219
+ "epoch": 0.8221680876979294,
1220
+ "grad_norm": 0.5192279815673828,
1221
+ "learning_rate": 0.00017336704515159986,
1222
+ "loss": 0.7444,
1223
+ "mean_token_accuracy": 0.8012512847781181,
1224
+ "num_tokens": 18211136.0,
1225
+ "step": 1350
1226
+ },
1227
+ {
1228
+ "epoch": 0.8282582216808769,
1229
+ "grad_norm": 0.5378620624542236,
1230
+ "learning_rate": 0.00017294545581303996,
1231
+ "loss": 0.7459,
1232
+ "mean_token_accuracy": 0.7981989249587059,
1233
+ "num_tokens": 18340645.0,
1234
+ "step": 1360
1235
+ },
1236
+ {
1237
+ "epoch": 0.8343483556638246,
1238
+ "grad_norm": 0.4879571497440338,
1239
+ "learning_rate": 0.00017252114521300918,
1240
+ "loss": 0.7877,
1241
+ "mean_token_accuracy": 0.7891893342137337,
1242
+ "num_tokens": 18465733.0,
1243
+ "step": 1370
1244
+ },
1245
+ {
1246
+ "epoch": 0.8404384896467723,
1247
+ "grad_norm": 0.5297388434410095,
1248
+ "learning_rate": 0.00017209413169532717,
1249
+ "loss": 0.7586,
1250
+ "mean_token_accuracy": 0.797142505645752,
1251
+ "num_tokens": 18598979.0,
1252
+ "step": 1380
1253
+ },
1254
+ {
1255
+ "epoch": 0.8465286236297198,
1256
+ "grad_norm": 0.5308396220207214,
1257
+ "learning_rate": 0.00017166443372066618,
1258
+ "loss": 0.7387,
1259
+ "mean_token_accuracy": 0.80123979896307,
1260
+ "num_tokens": 18735919.0,
1261
+ "step": 1390
1262
+ },
1263
+ {
1264
+ "epoch": 0.8526187576126675,
1265
+ "grad_norm": 0.49988579750061035,
1266
+ "learning_rate": 0.0001712320698657532,
1267
+ "loss": 0.7425,
1268
+ "mean_token_accuracy": 0.7996803268790245,
1269
+ "num_tokens": 18870877.0,
1270
+ "step": 1400
1271
+ },
1272
+ {
1273
+ "epoch": 0.8587088915956151,
1274
+ "grad_norm": 0.5971361994743347,
1275
+ "learning_rate": 0.0001707970588225665,
1276
+ "loss": 0.7691,
1277
+ "mean_token_accuracy": 0.7922965154051781,
1278
+ "num_tokens": 19000943.0,
1279
+ "step": 1410
1280
+ },
1281
+ {
1282
+ "epoch": 0.8647990255785627,
1283
+ "grad_norm": 0.5141698718070984,
1284
+ "learning_rate": 0.00017035941939752802,
1285
+ "loss": 0.7203,
1286
+ "mean_token_accuracy": 0.8036229625344277,
1287
+ "num_tokens": 19135039.0,
1288
+ "step": 1420
1289
+ },
1290
+ {
1291
+ "epoch": 0.8708891595615104,
1292
+ "grad_norm": 0.4647749066352844,
1293
+ "learning_rate": 0.0001699191705106898,
1294
+ "loss": 0.7136,
1295
+ "mean_token_accuracy": 0.8064323276281357,
1296
+ "num_tokens": 19274069.0,
1297
+ "step": 1430
1298
+ },
1299
+ {
1300
+ "epoch": 0.876979293544458,
1301
+ "grad_norm": 0.5511934161186218,
1302
+ "learning_rate": 0.00016947633119491633,
1303
+ "loss": 0.7455,
1304
+ "mean_token_accuracy": 0.7985599264502525,
1305
+ "num_tokens": 19409679.0,
1306
+ "step": 1440
1307
+ },
1308
+ {
1309
+ "epoch": 0.8830694275274056,
1310
+ "grad_norm": 0.4936945140361786,
1311
+ "learning_rate": 0.00016903092059506182,
1312
+ "loss": 0.7087,
1313
+ "mean_token_accuracy": 0.806523185968399,
1314
+ "num_tokens": 19547419.0,
1315
+ "step": 1450
1316
+ },
1317
+ {
1318
+ "epoch": 0.8891595615103532,
1319
+ "grad_norm": 0.5227787494659424,
1320
+ "learning_rate": 0.00016858295796714213,
1321
+ "loss": 0.7739,
1322
+ "mean_token_accuracy": 0.7941467314958572,
1323
+ "num_tokens": 19674455.0,
1324
+ "step": 1460
1325
+ },
1326
+ {
1327
+ "epoch": 0.8952496954933008,
1328
+ "grad_norm": 0.5046219825744629,
1329
+ "learning_rate": 0.00016813246267750282,
1330
+ "loss": 0.7361,
1331
+ "mean_token_accuracy": 0.8008369222283364,
1332
+ "num_tokens": 19809861.0,
1333
+ "step": 1470
1334
+ },
1335
+ {
1336
+ "epoch": 0.9013398294762485,
1337
+ "grad_norm": 0.4827081263065338,
1338
+ "learning_rate": 0.00016767945420198142,
1339
+ "loss": 0.7464,
1340
+ "mean_token_accuracy": 0.7986427888274192,
1341
+ "num_tokens": 19940696.0,
1342
+ "step": 1480
1343
+ },
1344
+ {
1345
+ "epoch": 0.9074299634591961,
1346
+ "grad_norm": 0.4970889687538147,
1347
+ "learning_rate": 0.00016722395212506567,
1348
+ "loss": 0.7528,
1349
+ "mean_token_accuracy": 0.7965970665216446,
1350
+ "num_tokens": 20070686.0,
1351
+ "step": 1490
1352
+ },
1353
+ {
1354
+ "epoch": 0.9135200974421437,
1355
+ "grad_norm": 0.44478070735931396,
1356
+ "learning_rate": 0.00016676597613904693,
1357
+ "loss": 0.7185,
1358
+ "mean_token_accuracy": 0.8081388726830483,
1359
+ "num_tokens": 20210260.0,
1360
+ "step": 1500
1361
+ },
1362
+ {
1363
+ "epoch": 0.9196102314250914,
1364
+ "grad_norm": 0.506136417388916,
1365
+ "learning_rate": 0.00016630554604316866,
1366
+ "loss": 0.7395,
1367
+ "mean_token_accuracy": 0.8003876298666001,
1368
+ "num_tokens": 20346235.0,
1369
+ "step": 1510
1370
+ },
1371
+ {
1372
+ "epoch": 0.925700365408039,
1373
+ "grad_norm": 0.500946044921875,
1374
+ "learning_rate": 0.00016584268174277053,
1375
+ "loss": 0.6889,
1376
+ "mean_token_accuracy": 0.8124501362442971,
1377
+ "num_tokens": 20481248.0,
1378
+ "step": 1520
1379
+ },
1380
+ {
1381
+ "epoch": 0.9317904993909866,
1382
+ "grad_norm": 0.48528990149497986,
1383
+ "learning_rate": 0.00016537740324842795,
1384
+ "loss": 0.7227,
1385
+ "mean_token_accuracy": 0.8041250064969063,
1386
+ "num_tokens": 20613531.0,
1387
+ "step": 1530
1388
+ },
1389
+ {
1390
+ "epoch": 0.9378806333739342,
1391
+ "grad_norm": 0.5070951581001282,
1392
+ "learning_rate": 0.00016490973067508674,
1393
+ "loss": 0.7091,
1394
+ "mean_token_accuracy": 0.8082544595003128,
1395
+ "num_tokens": 20750784.0,
1396
+ "step": 1540
1397
+ },
1398
+ {
1399
+ "epoch": 0.9439707673568819,
1400
+ "grad_norm": 0.5583120584487915,
1401
+ "learning_rate": 0.0001644396842411939,
1402
+ "loss": 0.7405,
1403
+ "mean_token_accuracy": 0.7992320343852043,
1404
+ "num_tokens": 20883646.0,
1405
+ "step": 1550
1406
+ },
1407
+ {
1408
+ "epoch": 0.9500609013398295,
1409
+ "grad_norm": 0.5099635124206543,
1410
+ "learning_rate": 0.00016396728426782312,
1411
+ "loss": 0.7103,
1412
+ "mean_token_accuracy": 0.8091216519474983,
1413
+ "num_tokens": 21025143.0,
1414
+ "step": 1560
1415
+ },
1416
+ {
1417
+ "epoch": 0.9561510353227771,
1418
+ "grad_norm": 0.5777808427810669,
1419
+ "learning_rate": 0.00016349255117779652,
1420
+ "loss": 0.7245,
1421
+ "mean_token_accuracy": 0.8023119494318962,
1422
+ "num_tokens": 21160014.0,
1423
+ "step": 1570
1424
+ },
1425
+ {
1426
+ "epoch": 0.9622411693057247,
1427
+ "grad_norm": 0.5206162333488464,
1428
+ "learning_rate": 0.0001630155054948016,
1429
+ "loss": 0.7185,
1430
+ "mean_token_accuracy": 0.8069521963596344,
1431
+ "num_tokens": 21299094.0,
1432
+ "step": 1580
1433
+ },
1434
+ {
1435
+ "epoch": 0.9683313032886723,
1436
+ "grad_norm": 0.5763202905654907,
1437
+ "learning_rate": 0.00016253616784250415,
1438
+ "loss": 0.7677,
1439
+ "mean_token_accuracy": 0.7927820891141891,
1440
+ "num_tokens": 21429252.0,
1441
+ "step": 1590
1442
+ },
1443
+ {
1444
+ "epoch": 0.97442143727162,
1445
+ "grad_norm": 0.5068426728248596,
1446
+ "learning_rate": 0.00016205455894365627,
1447
+ "loss": 0.7673,
1448
+ "mean_token_accuracy": 0.794715291261673,
1449
+ "num_tokens": 21556200.0,
1450
+ "step": 1600
1451
+ },
1452
+ {
1453
+ "epoch": 0.9805115712545676,
1454
+ "grad_norm": 0.46094459295272827,
1455
+ "learning_rate": 0.0001615706996192009,
1456
+ "loss": 0.771,
1457
+ "mean_token_accuracy": 0.7921045809984207,
1458
+ "num_tokens": 21681524.0,
1459
+ "step": 1610
1460
+ },
1461
+ {
1462
+ "epoch": 0.9866017052375152,
1463
+ "grad_norm": 0.5063546299934387,
1464
+ "learning_rate": 0.00016108461078737148,
1465
+ "loss": 0.7383,
1466
+ "mean_token_accuracy": 0.800596435368061,
1467
+ "num_tokens": 21814109.0,
1468
+ "step": 1620
1469
+ },
1470
+ {
1471
+ "epoch": 0.9926918392204629,
1472
+ "grad_norm": 0.5418652296066284,
1473
+ "learning_rate": 0.0001605963134627876,
1474
+ "loss": 0.7431,
1475
+ "mean_token_accuracy": 0.7994748756289483,
1476
+ "num_tokens": 21947346.0,
1477
+ "step": 1630
1478
+ },
1479
+ {
1480
+ "epoch": 0.9987819732034104,
1481
+ "grad_norm": 0.6195595264434814,
1482
+ "learning_rate": 0.0001601058287555465,
1483
+ "loss": 0.7294,
1484
+ "mean_token_accuracy": 0.8030684441328049,
1485
+ "num_tokens": 22081340.0,
1486
+ "step": 1640
1487
+ },
1488
+ {
1489
+ "epoch": 1.004872107186358,
1490
+ "grad_norm": 0.5930359363555908,
1491
+ "learning_rate": 0.00015961317787031054,
1492
+ "loss": 0.7387,
1493
+ "mean_token_accuracy": 0.8013696864247322,
1494
+ "num_tokens": 22206441.0,
1495
+ "step": 1650
1496
+ },
1497
+ {
1498
+ "epoch": 1.0109622411693058,
1499
+ "grad_norm": 0.4926474094390869,
1500
+ "learning_rate": 0.00015911838210539038,
1501
+ "loss": 0.6743,
1502
+ "mean_token_accuracy": 0.8141208037734031,
1503
+ "num_tokens": 22344898.0,
1504
+ "step": 1660
1505
+ },
1506
+ {
1507
+ "epoch": 1.0170523751522533,
1508
+ "grad_norm": 0.5331000685691833,
1509
+ "learning_rate": 0.0001586214628518242,
1510
+ "loss": 0.7033,
1511
+ "mean_token_accuracy": 0.807385990023613,
1512
+ "num_tokens": 22483135.0,
1513
+ "step": 1670
1514
+ },
1515
+ {
1516
+ "epoch": 1.0231425091352009,
1517
+ "grad_norm": 0.5267267227172852,
1518
+ "learning_rate": 0.0001581224415924531,
1519
+ "loss": 0.6717,
1520
+ "mean_token_accuracy": 0.8178876608610153,
1521
+ "num_tokens": 22617934.0,
1522
+ "step": 1680
1523
+ },
1524
+ {
1525
+ "epoch": 1.0292326431181487,
1526
+ "grad_norm": 0.5864041447639465,
1527
+ "learning_rate": 0.00015762133990099205,
1528
+ "loss": 0.7421,
1529
+ "mean_token_accuracy": 0.7981289237737655,
1530
+ "num_tokens": 22745190.0,
1531
+ "step": 1690
1532
+ },
1533
+ {
1534
+ "epoch": 1.0353227771010962,
1535
+ "grad_norm": 0.45681944489479065,
1536
+ "learning_rate": 0.00015711817944109738,
1537
+ "loss": 0.6646,
1538
+ "mean_token_accuracy": 0.8146520599722862,
1539
+ "num_tokens": 22887536.0,
1540
+ "step": 1700
1541
+ },
1542
+ {
1543
+ "epoch": 1.0414129110840438,
1544
+ "grad_norm": 0.5522484183311462,
1545
+ "learning_rate": 0.00015661298196543042,
1546
+ "loss": 0.6889,
1547
+ "mean_token_accuracy": 0.8100781336426734,
1548
+ "num_tokens": 23017586.0,
1549
+ "step": 1710
1550
+ },
1551
+ {
1552
+ "epoch": 1.0475030450669915,
1553
+ "grad_norm": 0.5221629738807678,
1554
+ "learning_rate": 0.00015610576931471658,
1555
+ "loss": 0.6939,
1556
+ "mean_token_accuracy": 0.8114214852452278,
1557
+ "num_tokens": 23151737.0,
1558
+ "step": 1720
1559
+ },
1560
+ {
1561
+ "epoch": 1.053593179049939,
1562
+ "grad_norm": 0.5104020833969116,
1563
+ "learning_rate": 0.00015559656341680164,
1564
+ "loss": 0.716,
1565
+ "mean_token_accuracy": 0.8063826873898506,
1566
+ "num_tokens": 23280778.0,
1567
+ "step": 1730
1568
+ },
1569
+ {
1570
+ "epoch": 1.0596833130328867,
1571
+ "grad_norm": 0.5163984298706055,
1572
+ "learning_rate": 0.00015508538628570352,
1573
+ "loss": 0.7188,
1574
+ "mean_token_accuracy": 0.802527217566967,
1575
+ "num_tokens": 23410327.0,
1576
+ "step": 1740
1577
+ },
1578
+ {
1579
+ "epoch": 1.0657734470158344,
1580
+ "grad_norm": 0.5188373327255249,
1581
+ "learning_rate": 0.00015457226002066058,
1582
+ "loss": 0.6791,
1583
+ "mean_token_accuracy": 0.8127639785408973,
1584
+ "num_tokens": 23548616.0,
1585
+ "step": 1750
1586
+ },
1587
+ {
1588
+ "epoch": 1.071863580998782,
1589
+ "grad_norm": 0.5983869433403015,
1590
+ "learning_rate": 0.00015405720680517618,
1591
+ "loss": 0.6869,
1592
+ "mean_token_accuracy": 0.8110290810465812,
1593
+ "num_tokens": 23682446.0,
1594
+ "step": 1760
1595
+ },
1596
+ {
1597
+ "epoch": 1.0779537149817295,
1598
+ "grad_norm": 0.5919123291969299,
1599
+ "learning_rate": 0.00015354024890605985,
1600
+ "loss": 0.7419,
1601
+ "mean_token_accuracy": 0.7984233900904656,
1602
+ "num_tokens": 23806352.0,
1603
+ "step": 1770
1604
+ },
1605
+ {
1606
+ "epoch": 1.0840438489646773,
1607
+ "grad_norm": 0.4900698661804199,
1608
+ "learning_rate": 0.0001530214086724644,
1609
+ "loss": 0.6781,
1610
+ "mean_token_accuracy": 0.8152358055114746,
1611
+ "num_tokens": 23942964.0,
1612
+ "step": 1780
1613
+ },
1614
+ {
1615
+ "epoch": 1.0901339829476249,
1616
+ "grad_norm": 0.5409672856330872,
1617
+ "learning_rate": 0.00015250070853491986,
1618
+ "loss": 0.7157,
1619
+ "mean_token_accuracy": 0.803682966530323,
1620
+ "num_tokens": 24070937.0,
1621
+ "step": 1790
1622
+ },
1623
+ {
1624
+ "epoch": 1.0962241169305724,
1625
+ "grad_norm": 0.5581572651863098,
1626
+ "learning_rate": 0.0001519781710043638,
1627
+ "loss": 0.7261,
1628
+ "mean_token_accuracy": 0.8027503877878189,
1629
+ "num_tokens": 24200686.0,
1630
+ "step": 1800
1631
+ },
1632
+ {
1633
+ "epoch": 1.1023142509135202,
1634
+ "grad_norm": 0.503963053226471,
1635
+ "learning_rate": 0.0001514538186711679,
1636
+ "loss": 0.7125,
1637
+ "mean_token_accuracy": 0.8042754918336869,
1638
+ "num_tokens": 24329983.0,
1639
+ "step": 1810
1640
+ },
1641
+ {
1642
+ "epoch": 1.1084043848964678,
1643
+ "grad_norm": 0.6159723997116089,
1644
+ "learning_rate": 0.00015092767420416168,
1645
+ "loss": 0.6873,
1646
+ "mean_token_accuracy": 0.8115814313292503,
1647
+ "num_tokens": 24465292.0,
1648
+ "step": 1820
1649
+ },
1650
+ {
1651
+ "epoch": 1.1144945188794153,
1652
+ "grad_norm": 0.518172562122345,
1653
+ "learning_rate": 0.00015039976034965214,
1654
+ "loss": 0.6805,
1655
+ "mean_token_accuracy": 0.8113815248012543,
1656
+ "num_tokens": 24599980.0,
1657
+ "step": 1830
1658
+ },
1659
+ {
1660
+ "epoch": 1.1205846528623629,
1661
+ "grad_norm": 0.5381601452827454,
1662
+ "learning_rate": 0.0001498700999304407,
1663
+ "loss": 0.6542,
1664
+ "mean_token_accuracy": 0.8188014090061188,
1665
+ "num_tokens": 24746703.0,
1666
+ "step": 1840
1667
+ },
1668
+ {
1669
+ "epoch": 1.1266747868453106,
1670
+ "grad_norm": 0.5001223683357239,
1671
+ "learning_rate": 0.00014933871584483615,
1672
+ "loss": 0.7255,
1673
+ "mean_token_accuracy": 0.8022593036293983,
1674
+ "num_tokens": 24877604.0,
1675
+ "step": 1850
1676
+ },
1677
+ {
1678
+ "epoch": 1.1327649208282582,
1679
+ "grad_norm": 0.5812251567840576,
1680
+ "learning_rate": 0.00014880563106566512,
1681
+ "loss": 0.6638,
1682
+ "mean_token_accuracy": 0.8161928996443748,
1683
+ "num_tokens": 25023049.0,
1684
+ "step": 1860
1685
+ },
1686
+ {
1687
+ "epoch": 1.1388550548112057,
1688
+ "grad_norm": 0.5384249091148376,
1689
+ "learning_rate": 0.0001482708686392786,
1690
+ "loss": 0.6623,
1691
+ "mean_token_accuracy": 0.8167443484067917,
1692
+ "num_tokens": 25162124.0,
1693
+ "step": 1870
1694
+ },
1695
+ {
1696
+ "epoch": 1.1449451887941535,
1697
+ "grad_norm": 0.5310192108154297,
1698
+ "learning_rate": 0.00014773445168455576,
1699
+ "loss": 0.7074,
1700
+ "mean_token_accuracy": 0.8042578861117363,
1701
+ "num_tokens": 25293569.0,
1702
+ "step": 1880
1703
+ },
1704
+ {
1705
+ "epoch": 1.151035322777101,
1706
+ "grad_norm": 0.6224446296691895,
1707
+ "learning_rate": 0.00014719640339190443,
1708
+ "loss": 0.7094,
1709
+ "mean_token_accuracy": 0.803679920732975,
1710
+ "num_tokens": 25422953.0,
1711
+ "step": 1890
1712
+ },
1713
+ {
1714
+ "epoch": 1.1571254567600486,
1715
+ "grad_norm": 0.5978189706802368,
1716
+ "learning_rate": 0.00014665674702225853,
1717
+ "loss": 0.6926,
1718
+ "mean_token_accuracy": 0.8080565810203553,
1719
+ "num_tokens": 25559091.0,
1720
+ "step": 1900
1721
+ },
1722
+ {
1723
+ "epoch": 1.1632155907429964,
1724
+ "grad_norm": 0.6134657263755798,
1725
+ "learning_rate": 0.00014611550590607245,
1726
+ "loss": 0.6716,
1727
+ "mean_token_accuracy": 0.8152063637971878,
1728
+ "num_tokens": 25698134.0,
1729
+ "step": 1910
1730
+ },
1731
+ {
1732
+ "epoch": 1.169305724725944,
1733
+ "grad_norm": 0.5075950026512146,
1734
+ "learning_rate": 0.00014557270344231246,
1735
+ "loss": 0.6613,
1736
+ "mean_token_accuracy": 0.8169043198227882,
1737
+ "num_tokens": 25835159.0,
1738
+ "step": 1920
1739
+ },
1740
+ {
1741
+ "epoch": 1.1753958587088915,
1742
+ "grad_norm": 0.5035059452056885,
1743
+ "learning_rate": 0.00014502836309744508,
1744
+ "loss": 0.6903,
1745
+ "mean_token_accuracy": 0.8096718549728393,
1746
+ "num_tokens": 25970600.0,
1747
+ "step": 1930
1748
+ },
1749
+ {
1750
+ "epoch": 1.1814859926918393,
1751
+ "grad_norm": 0.583890438079834,
1752
+ "learning_rate": 0.00014448250840442254,
1753
+ "loss": 0.6662,
1754
+ "mean_token_accuracy": 0.8157578155398368,
1755
+ "num_tokens": 26106658.0,
1756
+ "step": 1940
1757
+ },
1758
+ {
1759
+ "epoch": 1.1875761266747868,
1760
+ "grad_norm": 0.5089572668075562,
1761
+ "learning_rate": 0.00014393516296166552,
1762
+ "loss": 0.7085,
1763
+ "mean_token_accuracy": 0.8082539036870002,
1764
+ "num_tokens": 26238847.0,
1765
+ "step": 1950
1766
+ },
1767
+ {
1768
+ "epoch": 1.1936662606577344,
1769
+ "grad_norm": 0.4495029151439667,
1770
+ "learning_rate": 0.00014338635043204288,
1771
+ "loss": 0.7085,
1772
+ "mean_token_accuracy": 0.8075269401073456,
1773
+ "num_tokens": 26366417.0,
1774
+ "step": 1960
1775
+ },
1776
+ {
1777
+ "epoch": 1.1997563946406822,
1778
+ "grad_norm": 0.6390108466148376,
1779
+ "learning_rate": 0.00014283609454184855,
1780
+ "loss": 0.6935,
1781
+ "mean_token_accuracy": 0.8099950149655342,
1782
+ "num_tokens": 26498101.0,
1783
+ "step": 1970
1784
+ },
1785
+ {
1786
+ "epoch": 1.2058465286236297,
1787
+ "grad_norm": 0.5687986016273499,
1788
+ "learning_rate": 0.00014228441907977607,
1789
+ "loss": 0.7027,
1790
+ "mean_token_accuracy": 0.8083449766039849,
1791
+ "num_tokens": 26628513.0,
1792
+ "step": 1980
1793
+ },
1794
+ {
1795
+ "epoch": 1.2119366626065773,
1796
+ "grad_norm": 0.487954318523407,
1797
+ "learning_rate": 0.00014173134789588994,
1798
+ "loss": 0.6731,
1799
+ "mean_token_accuracy": 0.8129799589514732,
1800
+ "num_tokens": 26761671.0,
1801
+ "step": 1990
1802
+ },
1803
+ {
1804
+ "epoch": 1.218026796589525,
1805
+ "grad_norm": 0.5641826391220093,
1806
+ "learning_rate": 0.00014117690490059447,
1807
+ "loss": 0.6949,
1808
+ "mean_token_accuracy": 0.8118783175945282,
1809
+ "num_tokens": 26894870.0,
1810
+ "step": 2000
1811
+ },
1812
+ {
1813
+ "epoch": 1.2241169305724726,
1814
+ "grad_norm": 0.5209829211235046,
1815
+ "learning_rate": 0.00014062111406360034,
1816
+ "loss": 0.6742,
1817
+ "mean_token_accuracy": 0.816123254597187,
1818
+ "num_tokens": 27027902.0,
1819
+ "step": 2010
1820
+ },
1821
+ {
1822
+ "epoch": 1.2302070645554202,
1823
+ "grad_norm": 0.5218231678009033,
1824
+ "learning_rate": 0.00014006399941288812,
1825
+ "loss": 0.703,
1826
+ "mean_token_accuracy": 0.805295330286026,
1827
+ "num_tokens": 27157882.0,
1828
+ "step": 2020
1829
+ },
1830
+ {
1831
+ "epoch": 1.236297198538368,
1832
+ "grad_norm": 0.48154470324516296,
1833
+ "learning_rate": 0.00013950558503366957,
1834
+ "loss": 0.6844,
1835
+ "mean_token_accuracy": 0.811684039235115,
1836
+ "num_tokens": 27290994.0,
1837
+ "step": 2030
1838
+ },
1839
+ {
1840
+ "epoch": 1.2423873325213155,
1841
+ "grad_norm": 0.5417695045471191,
1842
+ "learning_rate": 0.00013894589506734643,
1843
+ "loss": 0.7253,
1844
+ "mean_token_accuracy": 0.8018206775188446,
1845
+ "num_tokens": 27420715.0,
1846
+ "step": 2040
1847
+ },
1848
+ {
1849
+ "epoch": 1.248477466504263,
1850
+ "grad_norm": 0.5282937288284302,
1851
+ "learning_rate": 0.00013838495371046671,
1852
+ "loss": 0.682,
1853
+ "mean_token_accuracy": 0.8128980100154877,
1854
+ "num_tokens": 27552040.0,
1855
+ "step": 2050
1856
+ },
1857
+ {
1858
+ "epoch": 1.2545676004872108,
1859
+ "grad_norm": 0.5213696360588074,
1860
+ "learning_rate": 0.0001378227852136785,
1861
+ "loss": 0.6728,
1862
+ "mean_token_accuracy": 0.8128269612789154,
1863
+ "num_tokens": 27686922.0,
1864
+ "step": 2060
1865
+ },
1866
+ {
1867
+ "epoch": 1.2606577344701584,
1868
+ "grad_norm": 0.4823834300041199,
1869
+ "learning_rate": 0.00013725941388068174,
1870
+ "loss": 0.6626,
1871
+ "mean_token_accuracy": 0.8177949145436287,
1872
+ "num_tokens": 27825036.0,
1873
+ "step": 2070
1874
+ },
1875
+ {
1876
+ "epoch": 1.266747868453106,
1877
+ "grad_norm": 0.6199477314949036,
1878
+ "learning_rate": 0.0001366948640671775,
1879
+ "loss": 0.686,
1880
+ "mean_token_accuracy": 0.8107037082314491,
1881
+ "num_tokens": 27961614.0,
1882
+ "step": 2080
1883
+ },
1884
+ {
1885
+ "epoch": 1.2728380024360537,
1886
+ "grad_norm": 0.4916837513446808,
1887
+ "learning_rate": 0.00013612916017981488,
1888
+ "loss": 0.6738,
1889
+ "mean_token_accuracy": 0.8149923622608185,
1890
+ "num_tokens": 28099524.0,
1891
+ "step": 2090
1892
+ },
1893
+ {
1894
+ "epoch": 1.2789281364190013,
1895
+ "grad_norm": 0.6001724600791931,
1896
+ "learning_rate": 0.00013556232667513607,
1897
+ "loss": 0.6637,
1898
+ "mean_token_accuracy": 0.8173324480652809,
1899
+ "num_tokens": 28237055.0,
1900
+ "step": 2100
1901
+ },
1902
+ {
1903
+ "epoch": 1.2850182704019488,
1904
+ "grad_norm": 0.5887413620948792,
1905
+ "learning_rate": 0.00013499438805851882,
1906
+ "loss": 0.6744,
1907
+ "mean_token_accuracy": 0.8149967223405838,
1908
+ "num_tokens": 28370538.0,
1909
+ "step": 2110
1910
+ },
1911
+ {
1912
+ "epoch": 1.2911084043848966,
1913
+ "grad_norm": 0.6208155751228333,
1914
+ "learning_rate": 0.00013442536888311733,
1915
+ "loss": 0.6973,
1916
+ "mean_token_accuracy": 0.8103871151804924,
1917
+ "num_tokens": 28499232.0,
1918
+ "step": 2120
1919
+ },
1920
+ {
1921
+ "epoch": 1.2971985383678442,
1922
+ "grad_norm": 0.5026904344558716,
1923
+ "learning_rate": 0.0001338552937488003,
1924
+ "loss": 0.6739,
1925
+ "mean_token_accuracy": 0.8153023451566697,
1926
+ "num_tokens": 28633993.0,
1927
+ "step": 2130
1928
+ },
1929
+ {
1930
+ "epoch": 1.3032886723507917,
1931
+ "grad_norm": 0.5218458771705627,
1932
+ "learning_rate": 0.00013328418730108795,
1933
+ "loss": 0.6619,
1934
+ "mean_token_accuracy": 0.8166303977370262,
1935
+ "num_tokens": 28774139.0,
1936
+ "step": 2140
1937
+ },
1938
+ {
1939
+ "epoch": 1.3093788063337393,
1940
+ "grad_norm": 0.519872784614563,
1941
+ "learning_rate": 0.00013271207423008622,
1942
+ "loss": 0.6804,
1943
+ "mean_token_accuracy": 0.8150519266724586,
1944
+ "num_tokens": 28910109.0,
1945
+ "step": 2150
1946
+ },
1947
+ {
1948
+ "epoch": 1.315468940316687,
1949
+ "grad_norm": 0.5219667553901672,
1950
+ "learning_rate": 0.00013213897926941942,
1951
+ "loss": 0.6682,
1952
+ "mean_token_accuracy": 0.8166522830724716,
1953
+ "num_tokens": 29045967.0,
1954
+ "step": 2160
1955
+ },
1956
+ {
1957
+ "epoch": 1.3215590742996346,
1958
+ "grad_norm": 0.5744656920433044,
1959
+ "learning_rate": 0.000131564927195161,
1960
+ "loss": 0.6772,
1961
+ "mean_token_accuracy": 0.8149690836668014,
1962
+ "num_tokens": 29180769.0,
1963
+ "step": 2170
1964
+ },
1965
+ {
1966
+ "epoch": 1.3276492082825821,
1967
+ "grad_norm": 0.5673508048057556,
1968
+ "learning_rate": 0.00013098994282476236,
1969
+ "loss": 0.6841,
1970
+ "mean_token_accuracy": 0.812624742090702,
1971
+ "num_tokens": 29313512.0,
1972
+ "step": 2180
1973
+ },
1974
+ {
1975
+ "epoch": 1.3337393422655297,
1976
+ "grad_norm": 0.5187074542045593,
1977
+ "learning_rate": 0.00013041405101598,
1978
+ "loss": 0.6281,
1979
+ "mean_token_accuracy": 0.8221091449260711,
1980
+ "num_tokens": 29454589.0,
1981
+ "step": 2190
1982
+ },
1983
+ {
1984
+ "epoch": 1.3398294762484775,
1985
+ "grad_norm": 0.5621201992034912,
1986
+ "learning_rate": 0.00012983727666580086,
1987
+ "loss": 0.6755,
1988
+ "mean_token_accuracy": 0.8157430678606034,
1989
+ "num_tokens": 29589968.0,
1990
+ "step": 2200
1991
+ },
1992
+ {
1993
+ "epoch": 1.345919610231425,
1994
+ "grad_norm": 0.579699695110321,
1995
+ "learning_rate": 0.00012925964470936598,
1996
+ "loss": 0.6859,
1997
+ "mean_token_accuracy": 0.8122102931141854,
1998
+ "num_tokens": 29720188.0,
1999
+ "step": 2210
2000
+ },
2001
+ {
2002
+ "epoch": 1.3520097442143726,
2003
+ "grad_norm": 0.6406823992729187,
2004
+ "learning_rate": 0.00012868118011889236,
2005
+ "loss": 0.684,
2006
+ "mean_token_accuracy": 0.8107294023036957,
2007
+ "num_tokens": 29848418.0,
2008
+ "step": 2220
2009
+ },
2010
+ {
2011
+ "epoch": 1.3580998781973204,
2012
+ "grad_norm": 0.4707708954811096,
2013
+ "learning_rate": 0.00012810190790259367,
2014
+ "loss": 0.6607,
2015
+ "mean_token_accuracy": 0.8182852879166603,
2016
+ "num_tokens": 29988202.0,
2017
+ "step": 2230
2018
+ },
2019
+ {
2020
+ "epoch": 1.364190012180268,
2021
+ "grad_norm": 0.6458183526992798,
2022
+ "learning_rate": 0.00012752185310359874,
2023
+ "loss": 0.6935,
2024
+ "mean_token_accuracy": 0.8089477211236954,
2025
+ "num_tokens": 30119777.0,
2026
+ "step": 2240
2027
+ },
2028
+ {
2029
+ "epoch": 1.3702801461632155,
2030
+ "grad_norm": 0.4278848469257355,
2031
+ "learning_rate": 0.00012694104079886918,
2032
+ "loss": 0.6565,
2033
+ "mean_token_accuracy": 0.8185079246759415,
2034
+ "num_tokens": 30256776.0,
2035
+ "step": 2250
2036
+ },
2037
+ {
2038
+ "epoch": 1.3763702801461632,
2039
+ "grad_norm": 0.5647698044776917,
2040
+ "learning_rate": 0.00012635949609811505,
2041
+ "loss": 0.6636,
2042
+ "mean_token_accuracy": 0.8155051723122597,
2043
+ "num_tokens": 30395629.0,
2044
+ "step": 2260
2045
+ },
2046
+ {
2047
+ "epoch": 1.3824604141291108,
2048
+ "grad_norm": 0.43498411774635315,
2049
+ "learning_rate": 0.00012577724414270937,
2050
+ "loss": 0.689,
2051
+ "mean_token_accuracy": 0.8125654354691505,
2052
+ "num_tokens": 30532805.0,
2053
+ "step": 2270
2054
+ },
2055
+ {
2056
+ "epoch": 1.3885505481120584,
2057
+ "grad_norm": 0.5296844244003296,
2058
+ "learning_rate": 0.00012519431010460136,
2059
+ "loss": 0.6854,
2060
+ "mean_token_accuracy": 0.8122918352484703,
2061
+ "num_tokens": 30664642.0,
2062
+ "step": 2280
2063
+ },
2064
+ {
2065
+ "epoch": 1.3946406820950061,
2066
+ "grad_norm": 0.44080430269241333,
2067
+ "learning_rate": 0.000124610719185228,
2068
+ "loss": 0.6405,
2069
+ "mean_token_accuracy": 0.8192834481596947,
2070
+ "num_tokens": 30805370.0,
2071
+ "step": 2290
2072
+ },
2073
+ {
2074
+ "epoch": 1.4007308160779537,
2075
+ "grad_norm": 0.5946847796440125,
2076
+ "learning_rate": 0.00012402649661442453,
2077
+ "loss": 0.7025,
2078
+ "mean_token_accuracy": 0.8085126876831055,
2079
+ "num_tokens": 30936385.0,
2080
+ "step": 2300
2081
+ },
2082
+ {
2083
+ "epoch": 1.4068209500609012,
2084
+ "grad_norm": 0.6572047472000122,
2085
+ "learning_rate": 0.0001234416676493339,
2086
+ "loss": 0.709,
2087
+ "mean_token_accuracy": 0.8046677514910698,
2088
+ "num_tokens": 31067615.0,
2089
+ "step": 2310
2090
+ },
2091
+ {
2092
+ "epoch": 1.412911084043849,
2093
+ "grad_norm": 0.4797047972679138,
2094
+ "learning_rate": 0.0001228562575733147,
2095
+ "loss": 0.6675,
2096
+ "mean_token_accuracy": 0.8157136350870132,
2097
+ "num_tokens": 31200044.0,
2098
+ "step": 2320
2099
+ },
2100
+ {
2101
+ "epoch": 1.4190012180267966,
2102
+ "grad_norm": 0.5451430082321167,
2103
+ "learning_rate": 0.0001222702916948481,
2104
+ "loss": 0.6746,
2105
+ "mean_token_accuracy": 0.8092615008354187,
2106
+ "num_tokens": 31334451.0,
2107
+ "step": 2330
2108
+ },
2109
+ {
2110
+ "epoch": 1.4250913520097441,
2111
+ "grad_norm": 0.5049906969070435,
2112
+ "learning_rate": 0.00012168379534644371,
2113
+ "loss": 0.6515,
2114
+ "mean_token_accuracy": 0.8203717589378356,
2115
+ "num_tokens": 31472218.0,
2116
+ "step": 2340
2117
+ },
2118
+ {
2119
+ "epoch": 1.431181485992692,
2120
+ "grad_norm": 0.6531693935394287,
2121
+ "learning_rate": 0.00012109679388354462,
2122
+ "loss": 0.6778,
2123
+ "mean_token_accuracy": 0.8134923160076142,
2124
+ "num_tokens": 31605853.0,
2125
+ "step": 2350
2126
+ },
2127
+ {
2128
+ "epoch": 1.4372716199756395,
2129
+ "grad_norm": 0.5340039730072021,
2130
+ "learning_rate": 0.00012050931268343089,
2131
+ "loss": 0.6628,
2132
+ "mean_token_accuracy": 0.8176047816872597,
2133
+ "num_tokens": 31741034.0,
2134
+ "step": 2360
2135
+ },
2136
+ {
2137
+ "epoch": 1.443361753958587,
2138
+ "grad_norm": 0.4518280625343323,
2139
+ "learning_rate": 0.00011992137714412266,
2140
+ "loss": 0.6407,
2141
+ "mean_token_accuracy": 0.8207336485385894,
2142
+ "num_tokens": 31878661.0,
2143
+ "step": 2370
2144
+ },
2145
+ {
2146
+ "epoch": 1.4494518879415348,
2147
+ "grad_norm": 0.5232827067375183,
2148
+ "learning_rate": 0.00011933301268328212,
2149
+ "loss": 0.6742,
2150
+ "mean_token_accuracy": 0.8158077761530876,
2151
+ "num_tokens": 32016524.0,
2152
+ "step": 2380
2153
+ },
2154
+ {
2155
+ "epoch": 1.4555420219244823,
2156
+ "grad_norm": 0.5181542634963989,
2157
+ "learning_rate": 0.00011874424473711457,
2158
+ "loss": 0.699,
2159
+ "mean_token_accuracy": 0.8078866004943848,
2160
+ "num_tokens": 32146820.0,
2161
+ "step": 2390
2162
+ },
2163
+ {
2164
+ "epoch": 1.46163215590743,
2165
+ "grad_norm": 0.5801041126251221,
2166
+ "learning_rate": 0.00011815509875926883,
2167
+ "loss": 0.6572,
2168
+ "mean_token_accuracy": 0.8183338135480881,
2169
+ "num_tokens": 32285928.0,
2170
+ "step": 2400
2171
+ },
2172
+ {
2173
+ "epoch": 1.4677222898903777,
2174
+ "grad_norm": 0.5347133874893188,
2175
+ "learning_rate": 0.00011756560021973679,
2176
+ "loss": 0.6738,
2177
+ "mean_token_accuracy": 0.8143690213561058,
2178
+ "num_tokens": 32416470.0,
2179
+ "step": 2410
2180
+ },
2181
+ {
2182
+ "epoch": 1.4738124238733252,
2183
+ "grad_norm": 0.4945615231990814,
2184
+ "learning_rate": 0.0001169757746037524,
2185
+ "loss": 0.6505,
2186
+ "mean_token_accuracy": 0.8196728631854058,
2187
+ "num_tokens": 32553798.0,
2188
+ "step": 2420
2189
+ },
2190
+ {
2191
+ "epoch": 1.4799025578562728,
2192
+ "grad_norm": 0.5072743892669678,
2193
+ "learning_rate": 0.00011638564741068965,
2194
+ "loss": 0.625,
2195
+ "mean_token_accuracy": 0.826240348815918,
2196
+ "num_tokens": 32692511.0,
2197
+ "step": 2430
2198
+ },
2199
+ {
2200
+ "epoch": 1.4859926918392206,
2201
+ "grad_norm": 0.5887538194656372,
2202
+ "learning_rate": 0.00011579524415296043,
2203
+ "loss": 0.6904,
2204
+ "mean_token_accuracy": 0.8112018033862114,
2205
+ "num_tokens": 32818836.0,
2206
+ "step": 2440
2207
+ },
2208
+ {
2209
+ "epoch": 1.4920828258221681,
2210
+ "grad_norm": 0.5464449524879456,
2211
+ "learning_rate": 0.00011520459035491142,
2212
+ "loss": 0.6553,
2213
+ "mean_token_accuracy": 0.8198345899581909,
2214
+ "num_tokens": 32957967.0,
2215
+ "step": 2450
2216
+ },
2217
+ {
2218
+ "epoch": 1.4981729598051157,
2219
+ "grad_norm": 0.5787419676780701,
2220
+ "learning_rate": 0.00011461371155172071,
2221
+ "loss": 0.663,
2222
+ "mean_token_accuracy": 0.8155046373605728,
2223
+ "num_tokens": 33094241.0,
2224
+ "step": 2460
2225
+ },
2226
+ {
2227
+ "epoch": 1.5042630937880634,
2228
+ "grad_norm": 0.5159268975257874,
2229
+ "learning_rate": 0.00011402263328829384,
2230
+ "loss": 0.6792,
2231
+ "mean_token_accuracy": 0.8127613604068756,
2232
+ "num_tokens": 33225474.0,
2233
+ "step": 2470
2234
+ },
2235
+ {
2236
+ "epoch": 1.510353227771011,
2237
+ "grad_norm": 0.5665333867073059,
2238
+ "learning_rate": 0.00011343138111815939,
2239
+ "loss": 0.6265,
2240
+ "mean_token_accuracy": 0.8276977241039276,
2241
+ "num_tokens": 33368246.0,
2242
+ "step": 2480
2243
+ },
2244
+ {
2245
+ "epoch": 1.5164433617539586,
2246
+ "grad_norm": 0.6272276639938354,
2247
+ "learning_rate": 0.00011283998060236421,
2248
+ "loss": 0.6734,
2249
+ "mean_token_accuracy": 0.816029068827629,
2250
+ "num_tokens": 33503967.0,
2251
+ "step": 2490
2252
+ },
2253
+ {
2254
+ "epoch": 1.5225334957369063,
2255
+ "grad_norm": 0.5275886654853821,
2256
+ "learning_rate": 0.0001122484573083686,
2257
+ "loss": 0.6457,
2258
+ "mean_token_accuracy": 0.8222623988986015,
2259
+ "num_tokens": 33641826.0,
2260
+ "step": 2500
2261
+ },
2262
+ {
2263
+ "epoch": 1.5286236297198539,
2264
+ "grad_norm": 0.5526687502861023,
2265
+ "learning_rate": 0.00011165683680894072,
2266
+ "loss": 0.6795,
2267
+ "mean_token_accuracy": 0.8127825185656548,
2268
+ "num_tokens": 33774185.0,
2269
+ "step": 2510
2270
+ },
2271
+ {
2272
+ "epoch": 1.5347137637028014,
2273
+ "grad_norm": 0.6226133704185486,
2274
+ "learning_rate": 0.00011106514468105111,
2275
+ "loss": 0.6684,
2276
+ "mean_token_accuracy": 0.815614765882492,
2277
+ "num_tokens": 33907116.0,
2278
+ "step": 2520
2279
+ },
2280
+ {
2281
+ "epoch": 1.5408038976857492,
2282
+ "grad_norm": 0.612832248210907,
2283
+ "learning_rate": 0.000110473406504767,
2284
+ "loss": 0.6287,
2285
+ "mean_token_accuracy": 0.8220825806260109,
2286
+ "num_tokens": 34048267.0,
2287
+ "step": 2530
2288
+ },
2289
+ {
2290
+ "epoch": 1.5468940316686965,
2291
+ "grad_norm": 0.6066681742668152,
2292
+ "learning_rate": 0.00010988164786214639,
2293
+ "loss": 0.6851,
2294
+ "mean_token_accuracy": 0.8115911707282066,
2295
+ "num_tokens": 34177555.0,
2296
+ "step": 2540
2297
+ },
2298
+ {
2299
+ "epoch": 1.5529841656516443,
2300
+ "grad_norm": 0.6376360058784485,
2301
+ "learning_rate": 0.00010928989433613204,
2302
+ "loss": 0.6921,
2303
+ "mean_token_accuracy": 0.8096534594893455,
2304
+ "num_tokens": 34308932.0,
2305
+ "step": 2550
2306
+ },
2307
+ {
2308
+ "epoch": 1.559074299634592,
2309
+ "grad_norm": 0.6083400249481201,
2310
+ "learning_rate": 0.00010869817150944546,
2311
+ "loss": 0.6575,
2312
+ "mean_token_accuracy": 0.8187816679477692,
2313
+ "num_tokens": 34443994.0,
2314
+ "step": 2560
2315
+ },
2316
+ {
2317
+ "epoch": 1.5651644336175394,
2318
+ "grad_norm": 0.6098156571388245,
2319
+ "learning_rate": 0.00010810650496348116,
2320
+ "loss": 0.6092,
2321
+ "mean_token_accuracy": 0.8285523638129234,
2322
+ "num_tokens": 34588403.0,
2323
+ "step": 2570
2324
+ },
2325
+ {
2326
+ "epoch": 1.5712545676004872,
2327
+ "grad_norm": 0.47795701026916504,
2328
+ "learning_rate": 0.00010751492027720027,
2329
+ "loss": 0.6423,
2330
+ "mean_token_accuracy": 0.8211737647652626,
2331
+ "num_tokens": 34730426.0,
2332
+ "step": 2580
2333
+ },
2334
+ {
2335
+ "epoch": 1.577344701583435,
2336
+ "grad_norm": 0.560787558555603,
2337
+ "learning_rate": 0.00010692344302602515,
2338
+ "loss": 0.6707,
2339
+ "mean_token_accuracy": 0.8134441033005715,
2340
+ "num_tokens": 34861708.0,
2341
+ "step": 2590
2342
+ },
2343
+ {
2344
+ "epoch": 1.5834348355663823,
2345
+ "grad_norm": 0.5722246766090393,
2346
+ "learning_rate": 0.00010633209878073343,
2347
+ "loss": 0.6533,
2348
+ "mean_token_accuracy": 0.8185199156403542,
2349
+ "num_tokens": 34997377.0,
2350
+ "step": 2600
2351
+ },
2352
+ {
2353
+ "epoch": 1.58952496954933,
2354
+ "grad_norm": 0.4941788613796234,
2355
+ "learning_rate": 0.00010574091310635263,
2356
+ "loss": 0.6487,
2357
+ "mean_token_accuracy": 0.8205527886748314,
2358
+ "num_tokens": 35133685.0,
2359
+ "step": 2610
2360
+ },
2361
+ {
2362
+ "epoch": 1.5956151035322779,
2363
+ "grad_norm": 0.575986921787262,
2364
+ "learning_rate": 0.00010514991156105493,
2365
+ "loss": 0.6615,
2366
+ "mean_token_accuracy": 0.8179458349943161,
2367
+ "num_tokens": 35270993.0,
2368
+ "step": 2620
2369
+ },
2370
+ {
2371
+ "epoch": 1.6017052375152252,
2372
+ "grad_norm": 0.5677866339683533,
2373
+ "learning_rate": 0.00010455911969505228,
2374
+ "loss": 0.6572,
2375
+ "mean_token_accuracy": 0.8155815675854683,
2376
+ "num_tokens": 35402062.0,
2377
+ "step": 2630
2378
+ },
2379
+ {
2380
+ "epoch": 1.607795371498173,
2381
+ "grad_norm": 0.6232825517654419,
2382
+ "learning_rate": 0.00010396856304949162,
2383
+ "loss": 0.6477,
2384
+ "mean_token_accuracy": 0.8209305629134178,
2385
+ "num_tokens": 35537394.0,
2386
+ "step": 2640
2387
+ },
2388
+ {
2389
+ "epoch": 1.6138855054811205,
2390
+ "grad_norm": 0.6252410411834717,
2391
+ "learning_rate": 0.00010337826715535102,
2392
+ "loss": 0.6819,
2393
+ "mean_token_accuracy": 0.8137489795684815,
2394
+ "num_tokens": 35669332.0,
2395
+ "step": 2650
2396
+ },
2397
+ {
2398
+ "epoch": 1.619975639464068,
2399
+ "grad_norm": 0.5850580334663391,
2400
+ "learning_rate": 0.0001027882575323356,
2401
+ "loss": 0.6831,
2402
+ "mean_token_accuracy": 0.8099577218294144,
2403
+ "num_tokens": 35799095.0,
2404
+ "step": 2660
2405
+ },
2406
+ {
2407
+ "epoch": 1.6260657734470159,
2408
+ "grad_norm": 0.5118699073791504,
2409
+ "learning_rate": 0.00010219855968777442,
2410
+ "loss": 0.681,
2411
+ "mean_token_accuracy": 0.8123177006840706,
2412
+ "num_tokens": 35928313.0,
2413
+ "step": 2670
2414
+ },
2415
+ {
2416
+ "epoch": 1.6321559074299634,
2417
+ "grad_norm": 0.5392698645591736,
2418
+ "learning_rate": 0.00010160919911551774,
2419
+ "loss": 0.6536,
2420
+ "mean_token_accuracy": 0.8185337752103805,
2421
+ "num_tokens": 36062033.0,
2422
+ "step": 2680
2423
+ },
2424
+ {
2425
+ "epoch": 1.638246041412911,
2426
+ "grad_norm": 0.5542203783988953,
2427
+ "learning_rate": 0.00010102020129483481,
2428
+ "loss": 0.6859,
2429
+ "mean_token_accuracy": 0.8107540607452393,
2430
+ "num_tokens": 36190194.0,
2431
+ "step": 2690
2432
+ },
2433
+ {
2434
+ "epoch": 1.6443361753958587,
2435
+ "grad_norm": 0.5962918996810913,
2436
+ "learning_rate": 0.0001004315916893124,
2437
+ "loss": 0.64,
2438
+ "mean_token_accuracy": 0.8226593688130379,
2439
+ "num_tokens": 36322437.0,
2440
+ "step": 2700
2441
+ },
2442
+ {
2443
+ "epoch": 1.6504263093788063,
2444
+ "grad_norm": 0.6391364932060242,
2445
+ "learning_rate": 9.984339574575394e-05,
2446
+ "loss": 0.6457,
2447
+ "mean_token_accuracy": 0.8250340327620507,
2448
+ "num_tokens": 36463231.0,
2449
+ "step": 2710
2450
+ },
2451
+ {
2452
+ "epoch": 1.6565164433617539,
2453
+ "grad_norm": 0.5798075795173645,
2454
+ "learning_rate": 9.92556388930794e-05,
2455
+ "loss": 0.6901,
2456
+ "mean_token_accuracy": 0.8104871213436127,
2457
+ "num_tokens": 36588963.0,
2458
+ "step": 2720
2459
+ },
2460
+ {
2461
+ "epoch": 1.6626065773447016,
2462
+ "grad_norm": 0.5375143885612488,
2463
+ "learning_rate": 9.866834654122597e-05,
2464
+ "loss": 0.6723,
2465
+ "mean_token_accuracy": 0.8132491707801819,
2466
+ "num_tokens": 36724295.0,
2467
+ "step": 2730
2468
+ },
2469
+ {
2470
+ "epoch": 1.6686967113276492,
2471
+ "grad_norm": 0.5556331276893616,
2472
+ "learning_rate": 9.808154408004942e-05,
2473
+ "loss": 0.6316,
2474
+ "mean_token_accuracy": 0.8221101492643357,
2475
+ "num_tokens": 36855978.0,
2476
+ "step": 2740
2477
+ },
2478
+ {
2479
+ "epoch": 1.6747868453105967,
2480
+ "grad_norm": 0.5330142974853516,
2481
+ "learning_rate": 9.749525687822674e-05,
2482
+ "loss": 0.6269,
2483
+ "mean_token_accuracy": 0.8239532545208931,
2484
+ "num_tokens": 36994164.0,
2485
+ "step": 2750
2486
+ },
2487
+ {
2488
+ "epoch": 1.6808769792935445,
2489
+ "grad_norm": 0.568084716796875,
2490
+ "learning_rate": 9.6909510282159e-05,
2491
+ "loss": 0.6568,
2492
+ "mean_token_accuracy": 0.8158794924616813,
2493
+ "num_tokens": 37130680.0,
2494
+ "step": 2760
2495
+ },
2496
+ {
2497
+ "epoch": 1.686967113276492,
2498
+ "grad_norm": 0.5072943568229675,
2499
+ "learning_rate": 9.632432961487585e-05,
2500
+ "loss": 0.6838,
2501
+ "mean_token_accuracy": 0.8121756613254547,
2502
+ "num_tokens": 37261462.0,
2503
+ "step": 2770
2504
+ },
2505
+ {
2506
+ "epoch": 1.6930572472594396,
2507
+ "grad_norm": 0.5469337701797485,
2508
+ "learning_rate": 9.573974017494069e-05,
2509
+ "loss": 0.6447,
2510
+ "mean_token_accuracy": 0.8220986798405647,
2511
+ "num_tokens": 37395606.0,
2512
+ "step": 2780
2513
+ },
2514
+ {
2515
+ "epoch": 1.6991473812423874,
2516
+ "grad_norm": 0.57918381690979,
2517
+ "learning_rate": 9.515576723535689e-05,
2518
+ "loss": 0.6217,
2519
+ "mean_token_accuracy": 0.822702020406723,
2520
+ "num_tokens": 37533585.0,
2521
+ "step": 2790
2522
+ },
2523
+ {
2524
+ "epoch": 1.705237515225335,
2525
+ "grad_norm": 0.6425563097000122,
2526
+ "learning_rate": 9.45724360424753e-05,
2527
+ "loss": 0.6435,
2528
+ "mean_token_accuracy": 0.8198476612567902,
2529
+ "num_tokens": 37672877.0,
2530
+ "step": 2800
2531
+ },
2532
+ {
2533
+ "epoch": 1.7113276492082825,
2534
+ "grad_norm": 0.5059729218482971,
2535
+ "learning_rate": 9.398977181490274e-05,
2536
+ "loss": 0.6579,
2537
+ "mean_token_accuracy": 0.8166012555360794,
2538
+ "num_tokens": 37809109.0,
2539
+ "step": 2810
2540
+ },
2541
+ {
2542
+ "epoch": 1.7174177831912303,
2543
+ "grad_norm": 0.5450888276100159,
2544
+ "learning_rate": 9.340779974241167e-05,
2545
+ "loss": 0.6175,
2546
+ "mean_token_accuracy": 0.8274259582161904,
2547
+ "num_tokens": 37950597.0,
2548
+ "step": 2820
2549
+ },
2550
+ {
2551
+ "epoch": 1.7235079171741778,
2552
+ "grad_norm": 0.6464765667915344,
2553
+ "learning_rate": 9.282654498485139e-05,
2554
+ "loss": 0.6636,
2555
+ "mean_token_accuracy": 0.8163545817136765,
2556
+ "num_tokens": 38086904.0,
2557
+ "step": 2830
2558
+ },
2559
+ {
2560
+ "epoch": 1.7295980511571254,
2561
+ "grad_norm": 0.6118177175521851,
2562
+ "learning_rate": 9.22460326710601e-05,
2563
+ "loss": 0.6696,
2564
+ "mean_token_accuracy": 0.8133967757225037,
2565
+ "num_tokens": 38219759.0,
2566
+ "step": 2840
2567
+ },
2568
+ {
2569
+ "epoch": 1.7356881851400732,
2570
+ "grad_norm": 0.5518969893455505,
2571
+ "learning_rate": 9.16662878977786e-05,
2572
+ "loss": 0.6659,
2573
+ "mean_token_accuracy": 0.8180875137448311,
2574
+ "num_tokens": 38349770.0,
2575
+ "step": 2850
2576
+ },
2577
+ {
2578
+ "epoch": 1.7417783191230207,
2579
+ "grad_norm": 0.6465517282485962,
2580
+ "learning_rate": 9.108733572856549e-05,
2581
+ "loss": 0.6581,
2582
+ "mean_token_accuracy": 0.8170399129390716,
2583
+ "num_tokens": 38482303.0,
2584
+ "step": 2860
2585
+ },
2586
+ {
2587
+ "epoch": 1.7478684531059683,
2588
+ "grad_norm": 0.5193557143211365,
2589
+ "learning_rate": 9.050920119271335e-05,
2590
+ "loss": 0.6543,
2591
+ "mean_token_accuracy": 0.8178304255008697,
2592
+ "num_tokens": 38615426.0,
2593
+ "step": 2870
2594
+ },
2595
+ {
2596
+ "epoch": 1.753958587088916,
2597
+ "grad_norm": 0.611529529094696,
2598
+ "learning_rate": 8.993190928416682e-05,
2599
+ "loss": 0.6248,
2600
+ "mean_token_accuracy": 0.8259203046560287,
2601
+ "num_tokens": 38755859.0,
2602
+ "step": 2880
2603
+ },
2604
+ {
2605
+ "epoch": 1.7600487210718636,
2606
+ "grad_norm": 0.5405944585800171,
2607
+ "learning_rate": 8.935548496044198e-05,
2608
+ "loss": 0.6232,
2609
+ "mean_token_accuracy": 0.8281204700469971,
2610
+ "num_tokens": 38893007.0,
2611
+ "step": 2890
2612
+ },
2613
+ {
2614
+ "epoch": 1.7661388550548112,
2615
+ "grad_norm": 0.6433010697364807,
2616
+ "learning_rate": 8.877995314154748e-05,
2617
+ "loss": 0.6751,
2618
+ "mean_token_accuracy": 0.8155393078923225,
2619
+ "num_tokens": 39020285.0,
2620
+ "step": 2900
2621
+ },
2622
+ {
2623
+ "epoch": 1.772228989037759,
2624
+ "grad_norm": 0.47974956035614014,
2625
+ "learning_rate": 8.820533870890717e-05,
2626
+ "loss": 0.6527,
2627
+ "mean_token_accuracy": 0.8197720810770989,
2628
+ "num_tokens": 39151426.0,
2629
+ "step": 2910
2630
+ },
2631
+ {
2632
+ "epoch": 1.7783191230207065,
2633
+ "grad_norm": 0.5529680848121643,
2634
+ "learning_rate": 8.763166650428436e-05,
2635
+ "loss": 0.6262,
2636
+ "mean_token_accuracy": 0.8256829127669334,
2637
+ "num_tokens": 39294242.0,
2638
+ "step": 2920
2639
+ },
2640
+ {
2641
+ "epoch": 1.784409257003654,
2642
+ "grad_norm": 0.6060122847557068,
2643
+ "learning_rate": 8.705896132870797e-05,
2644
+ "loss": 0.6563,
2645
+ "mean_token_accuracy": 0.8192467406392098,
2646
+ "num_tokens": 39425879.0,
2647
+ "step": 2930
2648
+ },
2649
+ {
2650
+ "epoch": 1.7904993909866018,
2651
+ "grad_norm": 0.6099355220794678,
2652
+ "learning_rate": 8.648724794140017e-05,
2653
+ "loss": 0.6664,
2654
+ "mean_token_accuracy": 0.8186777010560036,
2655
+ "num_tokens": 39559787.0,
2656
+ "step": 2940
2657
+ },
2658
+ {
2659
+ "epoch": 1.7965895249695494,
2660
+ "grad_norm": 0.5908733010292053,
2661
+ "learning_rate": 8.591655105870615e-05,
2662
+ "loss": 0.6712,
2663
+ "mean_token_accuracy": 0.8136340633034707,
2664
+ "num_tokens": 39689823.0,
2665
+ "step": 2950
2666
+ },
2667
+ {
2668
+ "epoch": 1.802679658952497,
2669
+ "grad_norm": 0.5845519304275513,
2670
+ "learning_rate": 8.534689535302553e-05,
2671
+ "loss": 0.6608,
2672
+ "mean_token_accuracy": 0.8170475289225578,
2673
+ "num_tokens": 39820725.0,
2674
+ "step": 2960
2675
+ },
2676
+ {
2677
+ "epoch": 1.8087697929354447,
2678
+ "grad_norm": 0.6311175227165222,
2679
+ "learning_rate": 8.47783054517457e-05,
2680
+ "loss": 0.6491,
2681
+ "mean_token_accuracy": 0.8193596869707107,
2682
+ "num_tokens": 39947874.0,
2683
+ "step": 2970
2684
+ },
2685
+ {
2686
+ "epoch": 1.814859926918392,
2687
+ "grad_norm": 0.5293188691139221,
2688
+ "learning_rate": 8.421080593617706e-05,
2689
+ "loss": 0.6105,
2690
+ "mean_token_accuracy": 0.83141258507967,
2691
+ "num_tokens": 40091297.0,
2692
+ "step": 2980
2693
+ },
2694
+ {
2695
+ "epoch": 1.8209500609013398,
2696
+ "grad_norm": 0.5252617597579956,
2697
+ "learning_rate": 8.364442134049049e-05,
2698
+ "loss": 0.6356,
2699
+ "mean_token_accuracy": 0.8237936720252037,
2700
+ "num_tokens": 40229207.0,
2701
+ "step": 2990
2702
+ },
2703
+ {
2704
+ "epoch": 1.8270401948842876,
2705
+ "grad_norm": 0.6039798855781555,
2706
+ "learning_rate": 8.30791761506565e-05,
2707
+ "loss": 0.6456,
2708
+ "mean_token_accuracy": 0.8206364914774895,
2709
+ "num_tokens": 40364863.0,
2710
+ "step": 3000
2711
+ },
2712
+ {
2713
+ "epoch": 1.833130328867235,
2714
+ "grad_norm": 0.5508609414100647,
2715
+ "learning_rate": 8.251509480338684e-05,
2716
+ "loss": 0.6229,
2717
+ "mean_token_accuracy": 0.8255992740392685,
2718
+ "num_tokens": 40504123.0,
2719
+ "step": 3010
2720
+ },
2721
+ {
2722
+ "epoch": 1.8392204628501827,
2723
+ "grad_norm": 0.5637634992599487,
2724
+ "learning_rate": 8.195220168507789e-05,
2725
+ "loss": 0.6026,
2726
+ "mean_token_accuracy": 0.8290412962436676,
2727
+ "num_tokens": 40646821.0,
2728
+ "step": 3020
2729
+ },
2730
+ {
2731
+ "epoch": 1.8453105968331305,
2732
+ "grad_norm": 0.5463610291481018,
2733
+ "learning_rate": 8.139052113075645e-05,
2734
+ "loss": 0.6278,
2735
+ "mean_token_accuracy": 0.8244929850101471,
2736
+ "num_tokens": 40778989.0,
2737
+ "step": 3030
2738
+ },
2739
+ {
2740
+ "epoch": 1.8514007308160778,
2741
+ "grad_norm": 0.5360645055770874,
2742
+ "learning_rate": 8.083007742302776e-05,
2743
+ "loss": 0.6336,
2744
+ "mean_token_accuracy": 0.8228462666273118,
2745
+ "num_tokens": 40917560.0,
2746
+ "step": 3040
2747
+ },
2748
+ {
2749
+ "epoch": 1.8574908647990256,
2750
+ "grad_norm": 0.5185632705688477,
2751
+ "learning_rate": 8.02708947910255e-05,
2752
+ "loss": 0.5991,
2753
+ "mean_token_accuracy": 0.830042028427124,
2754
+ "num_tokens": 41059707.0,
2755
+ "step": 3050
2756
+ },
2757
+ {
2758
+ "epoch": 1.8635809987819734,
2759
+ "grad_norm": 0.6445353627204895,
2760
+ "learning_rate": 7.971299740936456e-05,
2761
+ "loss": 0.6555,
2762
+ "mean_token_accuracy": 0.8169184163212776,
2763
+ "num_tokens": 41192515.0,
2764
+ "step": 3060
2765
+ },
2766
+ {
2767
+ "epoch": 1.8696711327649207,
2768
+ "grad_norm": 0.5360421538352966,
2769
+ "learning_rate": 7.915640939709576e-05,
2770
+ "loss": 0.6234,
2771
+ "mean_token_accuracy": 0.8257398083806038,
2772
+ "num_tokens": 41330047.0,
2773
+ "step": 3070
2774
+ },
2775
+ {
2776
+ "epoch": 1.8757612667478685,
2777
+ "grad_norm": 0.58651202917099,
2778
+ "learning_rate": 7.860115481666333e-05,
2779
+ "loss": 0.6564,
2780
+ "mean_token_accuracy": 0.8205534905195236,
2781
+ "num_tokens": 41460379.0,
2782
+ "step": 3080
2783
+ },
2784
+ {
2785
+ "epoch": 1.881851400730816,
2786
+ "grad_norm": 0.6842640042304993,
2787
+ "learning_rate": 7.804725767286427e-05,
2788
+ "loss": 0.6935,
2789
+ "mean_token_accuracy": 0.8097458809614182,
2790
+ "num_tokens": 41581210.0,
2791
+ "step": 3090
2792
+ },
2793
+ {
2794
+ "epoch": 1.8879415347137636,
2795
+ "grad_norm": 0.5175514817237854,
2796
+ "learning_rate": 7.749474191181096e-05,
2797
+ "loss": 0.6393,
2798
+ "mean_token_accuracy": 0.8219558611512184,
2799
+ "num_tokens": 41714792.0,
2800
+ "step": 3100
2801
+ },
2802
+ {
2803
+ "epoch": 1.8940316686967114,
2804
+ "grad_norm": 0.5963588356971741,
2805
+ "learning_rate": 7.694363141989575e-05,
2806
+ "loss": 0.658,
2807
+ "mean_token_accuracy": 0.8182344615459443,
2808
+ "num_tokens": 41846600.0,
2809
+ "step": 3110
2810
+ },
2811
+ {
2812
+ "epoch": 1.900121802679659,
2813
+ "grad_norm": 0.6149535775184631,
2814
+ "learning_rate": 7.639395002275827e-05,
2815
+ "loss": 0.6499,
2816
+ "mean_token_accuracy": 0.8208124756813049,
2817
+ "num_tokens": 41977627.0,
2818
+ "step": 3120
2819
+ },
2820
+ {
2821
+ "epoch": 1.9062119366626065,
2822
+ "grad_norm": 0.5739808678627014,
2823
+ "learning_rate": 7.584572148425544e-05,
2824
+ "loss": 0.6703,
2825
+ "mean_token_accuracy": 0.8125967502593994,
2826
+ "num_tokens": 42104510.0,
2827
+ "step": 3130
2828
+ },
2829
+ {
2830
+ "epoch": 1.9123020706455542,
2831
+ "grad_norm": 0.5982648730278015,
2832
+ "learning_rate": 7.529896950543416e-05,
2833
+ "loss": 0.6513,
2834
+ "mean_token_accuracy": 0.8201186507940292,
2835
+ "num_tokens": 42236168.0,
2836
+ "step": 3140
2837
+ },
2838
+ {
2839
+ "epoch": 1.9183922046285018,
2840
+ "grad_norm": 0.5896486043930054,
2841
+ "learning_rate": 7.475371772350658e-05,
2842
+ "loss": 0.6133,
2843
+ "mean_token_accuracy": 0.8260134413838387,
2844
+ "num_tokens": 42375086.0,
2845
+ "step": 3150
2846
+ },
2847
+ {
2848
+ "epoch": 1.9244823386114494,
2849
+ "grad_norm": 0.6223361492156982,
2850
+ "learning_rate": 7.420998971082833e-05,
2851
+ "loss": 0.6638,
2852
+ "mean_token_accuracy": 0.8162963137030601,
2853
+ "num_tokens": 42506457.0,
2854
+ "step": 3160
2855
+ },
2856
+ {
2857
+ "epoch": 1.9305724725943971,
2858
+ "grad_norm": 0.709854245185852,
2859
+ "learning_rate": 7.366780897387924e-05,
2860
+ "loss": 0.6324,
2861
+ "mean_token_accuracy": 0.8247174829244613,
2862
+ "num_tokens": 42640886.0,
2863
+ "step": 3170
2864
+ },
2865
+ {
2866
+ "epoch": 1.9366626065773447,
2867
+ "grad_norm": 0.6794169545173645,
2868
+ "learning_rate": 7.312719895224736e-05,
2869
+ "loss": 0.6164,
2870
+ "mean_token_accuracy": 0.82676922082901,
2871
+ "num_tokens": 42781318.0,
2872
+ "step": 3180
2873
+ },
2874
+ {
2875
+ "epoch": 1.9427527405602922,
2876
+ "grad_norm": 0.49305981397628784,
2877
+ "learning_rate": 7.258818301761532e-05,
2878
+ "loss": 0.6216,
2879
+ "mean_token_accuracy": 0.8258268669247627,
2880
+ "num_tokens": 42919381.0,
2881
+ "step": 3190
2882
+ },
2883
+ {
2884
+ "epoch": 1.94884287454324,
2885
+ "grad_norm": 0.5072576999664307,
2886
+ "learning_rate": 7.205078447275031e-05,
2887
+ "loss": 0.6407,
2888
+ "mean_token_accuracy": 0.819316141307354,
2889
+ "num_tokens": 43056494.0,
2890
+ "step": 3200
2891
+ },
2892
+ {
2893
+ "epoch": 1.9549330085261876,
2894
+ "grad_norm": 0.6188381314277649,
2895
+ "learning_rate": 7.151502655049623e-05,
2896
+ "loss": 0.6022,
2897
+ "mean_token_accuracy": 0.8328602254390717,
2898
+ "num_tokens": 43197795.0,
2899
+ "step": 3210
2900
+ },
2901
+ {
2902
+ "epoch": 1.9610231425091351,
2903
+ "grad_norm": 0.5626131296157837,
2904
+ "learning_rate": 7.098093241276962e-05,
2905
+ "loss": 0.6245,
2906
+ "mean_token_accuracy": 0.8258091285824776,
2907
+ "num_tokens": 43340325.0,
2908
+ "step": 3220
2909
+ },
2910
+ {
2911
+ "epoch": 1.967113276492083,
2912
+ "grad_norm": 0.5364338755607605,
2913
+ "learning_rate": 7.044852514955816e-05,
2914
+ "loss": 0.6454,
2915
+ "mean_token_accuracy": 0.8199462234973908,
2916
+ "num_tokens": 43472226.0,
2917
+ "step": 3230
2918
+ },
2919
+ {
2920
+ "epoch": 1.9732034104750305,
2921
+ "grad_norm": 0.5460382699966431,
2922
+ "learning_rate": 6.991782777792244e-05,
2923
+ "loss": 0.6214,
2924
+ "mean_token_accuracy": 0.8251617640256882,
2925
+ "num_tokens": 43609559.0,
2926
+ "step": 3240
2927
+ },
2928
+ {
2929
+ "epoch": 1.979293544457978,
2930
+ "grad_norm": 0.6013203263282776,
2931
+ "learning_rate": 6.938886324100097e-05,
2932
+ "loss": 0.6422,
2933
+ "mean_token_accuracy": 0.8197862133383751,
2934
+ "num_tokens": 43743060.0,
2935
+ "step": 3250
2936
+ },
2937
+ {
2938
+ "epoch": 1.9853836784409258,
2939
+ "grad_norm": 0.6688512563705444,
2940
+ "learning_rate": 6.88616544070182e-05,
2941
+ "loss": 0.6447,
2942
+ "mean_token_accuracy": 0.820338460803032,
2943
+ "num_tokens": 43876874.0,
2944
+ "step": 3260
2945
+ },
2946
+ {
2947
+ "epoch": 1.9914738124238733,
2948
+ "grad_norm": 0.6146946549415588,
2949
+ "learning_rate": 6.8336224068296e-05,
2950
+ "loss": 0.6015,
2951
+ "mean_token_accuracy": 0.8318811848759651,
2952
+ "num_tokens": 44021963.0,
2953
+ "step": 3270
2954
+ },
2955
+ {
2956
+ "epoch": 1.997563946406821,
2957
+ "grad_norm": 0.5972597599029541,
2958
+ "learning_rate": 6.781259494026821e-05,
2959
+ "loss": 0.6094,
2960
+ "mean_token_accuracy": 0.8282003849744797,
2961
+ "num_tokens": 44159207.0,
2962
+ "step": 3280
2963
+ }
2964
+ ],
2965
+ "logging_steps": 10,
2966
+ "max_steps": 4926,
2967
+ "num_input_tokens_seen": 0,
2968
+ "num_train_epochs": 3,
2969
+ "save_steps": 500,
2970
+ "stateful_callbacks": {
2971
+ "TrainerControl": {
2972
+ "args": {
2973
+ "should_epoch_stop": false,
2974
+ "should_evaluate": false,
2975
+ "should_log": false,
2976
+ "should_save": true,
2977
+ "should_training_stop": false
2978
+ },
2979
+ "attributes": {}
2980
+ }
2981
+ },
2982
+ "total_flos": 5.398768566923166e+18,
2983
+ "train_batch_size": 1,
2984
+ "trial_name": null,
2985
+ "trial_params": null
2986
+ }
checkpoint-3284/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d57fe99d74b7e16ba38edb5265078ef5a69a65f6b630b2ca3feaacdb770f49e
3
+ size 6161
checkpoint-4926/README.md ADDED
@@ -0,0 +1,208 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: openai/gpt-oss-20b
3
+ library_name: peft
4
+ tags:
5
+ - base_model:adapter:openai/gpt-oss-20b
6
+ - lora
7
+ - sft
8
+ - transformers
9
+ - trl
10
+ ---
11
+
12
+ # Model Card for Model ID
13
+
14
+ <!-- Provide a quick summary of what the model is/does. -->
15
+
16
+
17
+
18
+ ## Model Details
19
+
20
+ ### Model Description
21
+
22
+ <!-- Provide a longer summary of what this model is. -->
23
+
24
+
25
+
26
+ - **Developed by:** [More Information Needed]
27
+ - **Funded by [optional]:** [More Information Needed]
28
+ - **Shared by [optional]:** [More Information Needed]
29
+ - **Model type:** [More Information Needed]
30
+ - **Language(s) (NLP):** [More Information Needed]
31
+ - **License:** [More Information Needed]
32
+ - **Finetuned from model [optional]:** [More Information Needed]
33
+
34
+ ### Model Sources [optional]
35
+
36
+ <!-- Provide the basic links for the model. -->
37
+
38
+ - **Repository:** [More Information Needed]
39
+ - **Paper [optional]:** [More Information Needed]
40
+ - **Demo [optional]:** [More Information Needed]
41
+
42
+ ## Uses
43
+
44
+ <!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
45
+
46
+ ### Direct Use
47
+
48
+ <!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
49
+
50
+ [More Information Needed]
51
+
52
+ ### Downstream Use [optional]
53
+
54
+ <!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
55
+
56
+ [More Information Needed]
57
+
58
+ ### Out-of-Scope Use
59
+
60
+ <!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
61
+
62
+ [More Information Needed]
63
+
64
+ ## Bias, Risks, and Limitations
65
+
66
+ <!-- This section is meant to convey both technical and sociotechnical limitations. -->
67
+
68
+ [More Information Needed]
69
+
70
+ ### Recommendations
71
+
72
+ <!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
73
+
74
+ Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
75
+
76
+ ## How to Get Started with the Model
77
+
78
+ Use the code below to get started with the model.
79
+
80
+ [More Information Needed]
81
+
82
+ ## Training Details
83
+
84
+ ### Training Data
85
+
86
+ <!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
87
+
88
+ [More Information Needed]
89
+
90
+ ### Training Procedure
91
+
92
+ <!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
93
+
94
+ #### Preprocessing [optional]
95
+
96
+ [More Information Needed]
97
+
98
+
99
+ #### Training Hyperparameters
100
+
101
+ - **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
102
+
103
+ #### Speeds, Sizes, Times [optional]
104
+
105
+ <!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
106
+
107
+ [More Information Needed]
108
+
109
+ ## Evaluation
110
+
111
+ <!-- This section describes the evaluation protocols and provides the results. -->
112
+
113
+ ### Testing Data, Factors & Metrics
114
+
115
+ #### Testing Data
116
+
117
+ <!-- This should link to a Dataset Card if possible. -->
118
+
119
+ [More Information Needed]
120
+
121
+ #### Factors
122
+
123
+ <!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
124
+
125
+ [More Information Needed]
126
+
127
+ #### Metrics
128
+
129
+ <!-- These are the evaluation metrics being used, ideally with a description of why. -->
130
+
131
+ [More Information Needed]
132
+
133
+ ### Results
134
+
135
+ [More Information Needed]
136
+
137
+ #### Summary
138
+
139
+
140
+
141
+ ## Model Examination [optional]
142
+
143
+ <!-- Relevant interpretability work for the model goes here -->
144
+
145
+ [More Information Needed]
146
+
147
+ ## Environmental Impact
148
+
149
+ <!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
150
+
151
+ Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
152
+
153
+ - **Hardware Type:** [More Information Needed]
154
+ - **Hours used:** [More Information Needed]
155
+ - **Cloud Provider:** [More Information Needed]
156
+ - **Compute Region:** [More Information Needed]
157
+ - **Carbon Emitted:** [More Information Needed]
158
+
159
+ ## Technical Specifications [optional]
160
+
161
+ ### Model Architecture and Objective
162
+
163
+ [More Information Needed]
164
+
165
+ ### Compute Infrastructure
166
+
167
+ [More Information Needed]
168
+
169
+ #### Hardware
170
+
171
+ [More Information Needed]
172
+
173
+ #### Software
174
+
175
+ [More Information Needed]
176
+
177
+ ## Citation [optional]
178
+
179
+ <!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
180
+
181
+ **BibTeX:**
182
+
183
+ [More Information Needed]
184
+
185
+ **APA:**
186
+
187
+ [More Information Needed]
188
+
189
+ ## Glossary [optional]
190
+
191
+ <!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
192
+
193
+ [More Information Needed]
194
+
195
+ ## More Information [optional]
196
+
197
+ [More Information Needed]
198
+
199
+ ## Model Card Authors [optional]
200
+
201
+ [More Information Needed]
202
+
203
+ ## Model Card Contact
204
+
205
+ [More Information Needed]
206
+ ### Framework versions
207
+
208
+ - PEFT 0.17.1
checkpoint-4926/adapter_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": {
4
+ "base_model_class": "GptOssForCausalLM",
5
+ "parent_library": "transformers.models.gpt_oss.modeling_gpt_oss"
6
+ },
7
+ "base_model_name_or_path": "openai/gpt-oss-20b",
8
+ "bias": "none",
9
+ "corda_config": null,
10
+ "eva_config": null,
11
+ "exclude_modules": null,
12
+ "fan_in_fan_out": false,
13
+ "inference_mode": true,
14
+ "init_lora_weights": true,
15
+ "layer_replication": null,
16
+ "layers_pattern": null,
17
+ "layers_to_transform": null,
18
+ "loftq_config": {},
19
+ "lora_alpha": 16,
20
+ "lora_bias": false,
21
+ "lora_dropout": 0.0,
22
+ "megatron_config": null,
23
+ "megatron_core": "megatron.core",
24
+ "modules_to_save": null,
25
+ "peft_type": "LORA",
26
+ "qalora_group_size": 16,
27
+ "r": 8,
28
+ "rank_pattern": {},
29
+ "revision": null,
30
+ "target_modules": [
31
+ "o_proj",
32
+ "k_proj",
33
+ "v_proj",
34
+ "q_proj"
35
+ ],
36
+ "target_parameters": [
37
+ "7.mlp.experts.gate_up_proj",
38
+ "7.mlp.experts.down_proj",
39
+ "15.mlp.experts.gate_up_proj",
40
+ "15.mlp.experts.down_proj",
41
+ "23.mlp.experts.gate_up_proj",
42
+ "23.mlp.experts.down_proj"
43
+ ],
44
+ "task_type": null,
45
+ "trainable_token_indices": null,
46
+ "use_dora": false,
47
+ "use_qalora": false,
48
+ "use_rslora": false
49
+ }
checkpoint-4926/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a12fc000b95c82bac6a99a48756a04e45988fdbd7cf08e8fc7d3059abbcb8677
3
+ size 2366470368
checkpoint-4926/chat_template.jinja ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#-
2
+ In addition to the normal inputs of `messages` and `tools`, this template also accepts the
3
+ following kwargs:
4
+ - "builtin_tools": A list, can contain "browser" and/or "python".
5
+ - "model_identity": A string that optionally describes the model identity.
6
+ - "reasoning_effort": A string that describes the reasoning effort, defaults to "medium".
7
+ #}
8
+
9
+ {#- Tool Definition Rendering ============================================== #}
10
+ {%- macro render_typescript_type(param_spec, required_params, is_nullable=false) -%}
11
+ {%- if param_spec.type == "array" -%}
12
+ {%- if param_spec['items'] -%}
13
+ {%- if param_spec['items']['type'] == "string" -%}
14
+ {{- "string[]" }}
15
+ {%- elif param_spec['items']['type'] == "number" -%}
16
+ {{- "number[]" }}
17
+ {%- elif param_spec['items']['type'] == "integer" -%}
18
+ {{- "number[]" }}
19
+ {%- elif param_spec['items']['type'] == "boolean" -%}
20
+ {{- "boolean[]" }}
21
+ {%- else -%}
22
+ {%- set inner_type = render_typescript_type(param_spec['items'], required_params) -%}
23
+ {%- if inner_type == "object | object" or inner_type|length > 50 -%}
24
+ {{- "any[]" }}
25
+ {%- else -%}
26
+ {{- inner_type + "[]" }}
27
+ {%- endif -%}
28
+ {%- endif -%}
29
+ {%- if param_spec.nullable -%}
30
+ {{- " | null" }}
31
+ {%- endif -%}
32
+ {%- else -%}
33
+ {{- "any[]" }}
34
+ {%- if param_spec.nullable -%}
35
+ {{- " | null" }}
36
+ {%- endif -%}
37
+ {%- endif -%}
38
+ {%- elif param_spec.type is defined and param_spec.type is iterable and param_spec.type is not string and param_spec.type is not mapping and param_spec.type[0] is defined -%}
39
+ {#- Handle array of types like ["object", "object"] from Union[dict, list] #}
40
+ {%- if param_spec.type | length > 1 -%}
41
+ {{- param_spec.type | join(" | ") }}
42
+ {%- else -%}
43
+ {{- param_spec.type[0] }}
44
+ {%- endif -%}
45
+ {%- elif param_spec.oneOf -%}
46
+ {#- Handle oneOf schemas - check for complex unions and fallback to any #}
47
+ {%- set has_object_variants = false -%}
48
+ {%- for variant in param_spec.oneOf -%}
49
+ {%- if variant.type == "object" -%}
50
+ {%- set has_object_variants = true -%}
51
+ {%- endif -%}
52
+ {%- endfor -%}
53
+ {%- if has_object_variants and param_spec.oneOf|length > 1 -%}
54
+ {{- "any" }}
55
+ {%- else -%}
56
+ {%- for variant in param_spec.oneOf -%}
57
+ {{- render_typescript_type(variant, required_params) -}}
58
+ {%- if variant.description %}
59
+ {{- "// " + variant.description }}
60
+ {%- endif -%}
61
+ {%- if variant.default is defined %}
62
+ {{ "// default: " + variant.default|tojson }}
63
+ {%- endif -%}
64
+ {%- if not loop.last %}
65
+ {{- " | " }}
66
+ {% endif -%}
67
+ {%- endfor -%}
68
+ {%- endif -%}
69
+ {%- elif param_spec.type == "string" -%}
70
+ {%- if param_spec.enum -%}
71
+ {{- '"' + param_spec.enum|join('" | "') + '"' -}}
72
+ {%- else -%}
73
+ {{- "string" }}
74
+ {%- if param_spec.nullable %}
75
+ {{- " | null" }}
76
+ {%- endif -%}
77
+ {%- endif -%}
78
+ {%- elif param_spec.type == "number" -%}
79
+ {{- "number" }}
80
+ {%- elif param_spec.type == "integer" -%}
81
+ {{- "number" }}
82
+ {%- elif param_spec.type == "boolean" -%}
83
+ {{- "boolean" }}
84
+
85
+ {%- elif param_spec.type == "object" -%}
86
+ {%- if param_spec.properties -%}
87
+ {{- "{\n" }}
88
+ {%- for prop_name, prop_spec in param_spec.properties.items() -%}
89
+ {{- prop_name -}}
90
+ {%- if prop_name not in (param_spec.required or []) -%}
91
+ {{- "?" }}
92
+ {%- endif -%}
93
+ {{- ": " }}
94
+ {{ render_typescript_type(prop_spec, param_spec.required or []) }}
95
+ {%- if not loop.last -%}
96
+ {{-", " }}
97
+ {%- endif -%}
98
+ {%- endfor -%}
99
+ {{- "}" }}
100
+ {%- else -%}
101
+ {{- "object" }}
102
+ {%- endif -%}
103
+ {%- else -%}
104
+ {{- "any" }}
105
+ {%- endif -%}
106
+ {%- endmacro -%}
107
+
108
+ {%- macro render_tool_namespace(namespace_name, tools) -%}
109
+ {{- "## " + namespace_name + "\n\n" }}
110
+ {{- "namespace " + namespace_name + " {\n\n" }}
111
+ {%- for tool in tools %}
112
+ {%- set tool = tool.function %}
113
+ {{- "// " + tool.description + "\n" }}
114
+ {{- "type "+ tool.name + " = " }}
115
+ {%- if tool.parameters and tool.parameters.properties %}
116
+ {{- "(_: {\n" }}
117
+ {%- for param_name, param_spec in tool.parameters.properties.items() %}
118
+ {%- if param_spec.description %}
119
+ {{- "// " + param_spec.description + "\n" }}
120
+ {%- endif %}
121
+ {{- param_name }}
122
+ {%- if param_name not in (tool.parameters.required or []) -%}
123
+ {{- "?" }}
124
+ {%- endif -%}
125
+ {{- ": " }}
126
+ {{- render_typescript_type(param_spec, tool.parameters.required or []) }}
127
+ {%- if param_spec.default is defined -%}
128
+ {%- if param_spec.enum %}
129
+ {{- ", // default: " + param_spec.default }}
130
+ {%- elif param_spec.oneOf %}
131
+ {{- "// default: " + param_spec.default }}
132
+ {%- else %}
133
+ {{- ", // default: " + param_spec.default|tojson }}
134
+ {%- endif -%}
135
+ {%- endif -%}
136
+ {%- if not loop.last %}
137
+ {{- ",\n" }}
138
+ {%- else %}
139
+ {{- ",\n" }}
140
+ {%- endif -%}
141
+ {%- endfor %}
142
+ {{- "}) => any;\n\n" }}
143
+ {%- else -%}
144
+ {{- "() => any;\n\n" }}
145
+ {%- endif -%}
146
+ {%- endfor %}
147
+ {{- "} // namespace " + namespace_name }}
148
+ {%- endmacro -%}
149
+
150
+ {%- macro render_builtin_tools(browser_tool, python_tool) -%}
151
+ {%- if browser_tool %}
152
+ {{- "## browser\n\n" }}
153
+ {{- "// Tool for browsing.\n" }}
154
+ {{- "// The `cursor` appears in brackets before each browsing display: `[{cursor}]`.\n" }}
155
+ {{- "// Cite information from the tool using the following format:\n" }}
156
+ {{- "// `【{cursor}†L{line_start}(-L{line_end})?】`, for example: `【6†L9-L11】` or `【8†L3】`.\n" }}
157
+ {{- "// Do not quote more than 10 words directly from the tool output.\n" }}
158
+ {{- "// sources=web (default: web)\n" }}
159
+ {{- "namespace browser {\n\n" }}
160
+ {{- "// Searches for information related to `query` and displays `topn` results.\n" }}
161
+ {{- "type search = (_: {\n" }}
162
+ {{- "query: string,\n" }}
163
+ {{- "topn?: number, // default: 10\n" }}
164
+ {{- "source?: string,\n" }}
165
+ {{- "}) => any;\n\n" }}
166
+ {{- "// Opens the link `id` from the page indicated by `cursor` starting at line number `loc`, showing `num_lines` lines.\n" }}
167
+ {{- "// Valid link ids are displayed with the formatting: `【{id}†.*】`.\n" }}
168
+ {{- "// If `cursor` is not provided, the most recent page is implied.\n" }}
169
+ {{- "// If `id` is a string, it is treated as a fully qualified URL associated with `source`.\n" }}
170
+ {{- "// If `loc` is not provided, the viewport will be positioned at the beginning of the document or centered on the most relevant passage, if available.\n" }}
171
+ {{- "// Use this function without `id` to scroll to a new location of an opened page.\n" }}
172
+ {{- "type open = (_: {\n" }}
173
+ {{- "id?: number | string, // default: -1\n" }}
174
+ {{- "cursor?: number, // default: -1\n" }}
175
+ {{- "loc?: number, // default: -1\n" }}
176
+ {{- "num_lines?: number, // default: -1\n" }}
177
+ {{- "view_source?: boolean, // default: false\n" }}
178
+ {{- "source?: string,\n" }}
179
+ {{- "}) => any;\n\n" }}
180
+ {{- "// Finds exact matches of `pattern` in the current page, or the page given by `cursor`.\n" }}
181
+ {{- "type find = (_: {\n" }}
182
+ {{- "pattern: string,\n" }}
183
+ {{- "cursor?: number, // default: -1\n" }}
184
+ {{- "}) => any;\n\n" }}
185
+ {{- "} // namespace browser\n\n" }}
186
+ {%- endif -%}
187
+
188
+ {%- if python_tool %}
189
+ {{- "## python\n\n" }}
190
+ {{- "Use this tool to execute Python code in your chain of thought. The code will not be shown to the user. This tool should be used for internal reasoning, but not for code that is intended to be visible to the user (e.g. when creating plots, tables, or files).\n\n" }}
191
+ {{- "When you send a message containing Python code to python, it will be executed in a stateful Jupyter notebook environment. python will respond with the output of the execution or time out after 120.0 seconds. The drive at '/mnt/data' can be used to save and persist user files. Internet access for this session is UNKNOWN. Depends on the cluster.\n\n" }}
192
+ {%- endif -%}
193
+ {%- endmacro -%}
194
+
195
+ {#- System Message Construction ============================================ #}
196
+ {%- macro build_system_message() -%}
197
+ {%- if model_identity is not defined %}
198
+ {%- set model_identity = "You are ChatGPT, a large language model trained by OpenAI." %}
199
+ {%- endif %}
200
+ {{- model_identity + "\n" }}
201
+ {{- "Knowledge cutoff: 2024-06\n" }}
202
+ {{- "Current date: " + strftime_now("%Y-%m-%d") + "\n\n" }}
203
+ {%- if reasoning_effort is not defined %}
204
+ {%- set reasoning_effort = "medium" %}
205
+ {%- endif %}
206
+ {{- "Reasoning: " + reasoning_effort + "\n\n" }}
207
+ {%- if builtin_tools %}
208
+ {{- "# Tools\n\n" }}
209
+ {%- set available_builtin_tools = namespace(browser=false, python=false) %}
210
+ {%- for tool in builtin_tools %}
211
+ {%- if tool == "browser" %}
212
+ {%- set available_builtin_tools.browser = true %}
213
+ {%- elif tool == "python" %}
214
+ {%- set available_builtin_tools.python = true %}
215
+ {%- endif %}
216
+ {%- endfor %}
217
+ {{- render_builtin_tools(available_builtin_tools.browser, available_builtin_tools.python) }}
218
+ {%- endif -%}
219
+ {{- "# Valid channels: analysis, commentary, final. Channel must be included for every message." }}
220
+ {%- if tools -%}
221
+ {{- "\nCalls to these tools must go to the commentary channel: 'functions'." }}
222
+ {%- endif -%}
223
+ {%- endmacro -%}
224
+
225
+ {#- Main Template Logic ================================================= #}
226
+ {#- Set defaults #}
227
+
228
+ {#- Render system message #}
229
+ {{- "<|start|>system<|message|>" }}
230
+ {{- build_system_message() }}
231
+ {{- "<|end|>" }}
232
+
233
+ {#- Extract developer message #}
234
+ {%- if messages[0].role == "developer" or messages[0].role == "system" %}
235
+ {%- set developer_message = messages[0].content %}
236
+ {%- set loop_messages = messages[1:] %}
237
+ {%- else %}
238
+ {%- set developer_message = "" %}
239
+ {%- set loop_messages = messages %}
240
+ {%- endif %}
241
+
242
+ {#- Render developer message #}
243
+ {%- if developer_message or tools %}
244
+ {{- "<|start|>developer<|message|>" }}
245
+ {%- if developer_message %}
246
+ {{- "# Instructions\n\n" }}
247
+ {{- developer_message }}
248
+ {{- "\n\n" }}
249
+ {%- endif %}
250
+ {%- if tools -%}
251
+ {{- "# Tools\n\n" }}
252
+ {{- render_tool_namespace("functions", tools) }}
253
+ {%- endif -%}
254
+ {{- "<|end|>" }}
255
+ {%- endif %}
256
+
257
+ {#- Render messages #}
258
+ {%- set last_tool_call = namespace(name=none) %}
259
+ {%- for message in loop_messages -%}
260
+ {#- At this point only assistant/user/tool messages should remain #}
261
+ {%- if message.role == 'assistant' -%}
262
+ {#- Checks to ensure the messages are being passed in the format we expect #}
263
+ {%- if "content" in message %}
264
+ {%- if "<|channel|>analysis<|message|>" in message.content or "<|channel|>final<|message|>" in message.content %}
265
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the content field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
266
+ {%- endif %}
267
+ {%- endif %}
268
+ {%- if "thinking" in message %}
269
+ {%- if "<|channel|>analysis<|message|>" in message.thinking or "<|channel|>final<|message|>" in message.thinking %}
270
+ {{- raise_exception("You have passed a message containing <|channel|> tags in the thinking field. Instead of doing this, you should pass analysis messages (the string between '<|message|>' and '<|end|>') in the 'thinking' field, and final messages (the string between '<|message|>' and '<|end|>') in the 'content' field.") }}
271
+ {%- endif %}
272
+ {%- endif %}
273
+ {%- if "tool_calls" in message %}
274
+ {#- We need very careful handling here - we want to drop the tool call analysis message if the model #}
275
+ {#- has output a later <|final|> message, but otherwise we want to retain it. This is the only case #}
276
+ {#- when we render CoT/analysis messages in inference. #}
277
+ {%- set future_final_message = namespace(found=false) %}
278
+ {%- for future_message in loop_messages[loop.index:] %}
279
+ {%- if future_message.role == 'assistant' and "tool_calls" not in future_message %}
280
+ {%- set future_final_message.found = true %}
281
+ {%- endif %}
282
+ {%- endfor %}
283
+ {#- We assume max 1 tool call per message, and so we infer the tool call name #}
284
+ {#- in "tool" messages from the most recent assistant tool call name #}
285
+ {%- set tool_call = message.tool_calls[0] %}
286
+ {%- if tool_call.function %}
287
+ {%- set tool_call = tool_call.function %}
288
+ {%- endif %}
289
+ {%- if message.content and message.thinking %}
290
+ {{- raise_exception("Cannot pass both content and thinking in an assistant message with tool calls! Put the analysis message in one or the other, but not both.") }}
291
+ {%- elif message.content and not future_final_message.found %}
292
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.content + "<|end|>" }}
293
+ {%- elif message.thinking and not future_final_message.found %}
294
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
295
+ {%- endif %}
296
+ {{- "<|start|>assistant to=" }}
297
+ {{- "functions." + tool_call.name + "<|channel|>commentary " }}
298
+ {{- (tool_call.content_type if tool_call.content_type is defined else "json") + "<|message|>" }}
299
+ {{- tool_call.arguments|tojson }}
300
+ {{- "<|call|>" }}
301
+ {%- set last_tool_call.name = tool_call.name %}
302
+ {%- elif loop.last and not add_generation_prompt %}
303
+ {#- Only render the CoT if the final turn is an assistant turn and add_generation_prompt is false #}
304
+ {#- This is a situation that should only occur in training, never in inference. #}
305
+ {%- if "thinking" in message %}
306
+ {{- "<|start|>assistant<|channel|>analysis<|message|>" + message.thinking + "<|end|>" }}
307
+ {%- endif %}
308
+ {#- <|return|> indicates the end of generation, but <|end|> does not #}
309
+ {#- <|return|> should never be an input to the model, but we include it as the final token #}
310
+ {#- when training, so the model learns to emit it. #}
311
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|return|>" }}
312
+ {%- else %}
313
+ {#- CoT is dropped during all previous turns, so we never render it for inference #}
314
+ {{- "<|start|>assistant<|channel|>final<|message|>" + message.content + "<|end|>" }}
315
+ {%- set last_tool_call.name = none %}
316
+ {%- endif %}
317
+ {%- elif message.role == 'tool' -%}
318
+ {%- if last_tool_call.name is none %}
319
+ {{- raise_exception("Message has tool role, but there was no previous assistant message with a tool call!") }}
320
+ {%- endif %}
321
+ {{- "<|start|>functions." + last_tool_call.name }}
322
+ {{- " to=assistant<|channel|>commentary<|message|>" + message.content|tojson + "<|end|>" }}
323
+ {%- elif message.role == 'user' -%}
324
+ {{- "<|start|>user<|message|>" + message.content + "<|end|>" }}
325
+ {%- endif -%}
326
+ {%- endfor -%}
327
+
328
+ {#- Generation prompt #}
329
+ {%- if add_generation_prompt -%}
330
+ <|start|>assistant
331
+ {%- endif -%}
checkpoint-4926/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c968d107bcfa844e488d2039804f39daa06485d721080be175306ae5d96751c5
3
+ size 120495883
checkpoint-4926/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b093dfe59b41efeb45cc3d628d3360abaa2303bbaa489081411faf431e52941d
3
+ size 16389
checkpoint-4926/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:450a0ac1645503c0b14fe9c37d77060cc76b1c9942dcfdd0e779cd526b2e98d9
3
+ size 16389