diff --git a/13B-ollama/anysecret-assistant-13B-Q4_K_M.gguf b/13B-ollama/anysecret-assistant-13B-Q4_K_M.gguf
deleted file mode 100644
index 1989cfc6c3c4f52887e58fa6ca4fcd66f5814171..0000000000000000000000000000000000000000
--- a/13B-ollama/anysecret-assistant-13B-Q4_K_M.gguf
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f635699554afee39a40c05ddd8f9dc35ecfc9b31c754d6849c805d98128d3641
-size 7866071424
diff --git a/13B-ollama/anysecret-assistant-13B-Q5_K_M.gguf b/13B-ollama/anysecret-assistant-13B-Q5_K_M.gguf
deleted file mode 100644
index 26b0b975dfdd66f87410a3a45fbed04114ebca9f..0000000000000000000000000000000000000000
--- a/13B-ollama/anysecret-assistant-13B-Q5_K_M.gguf
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:ca7857afe8908510859f7f6fe18232a1efa93fe7dac0e6b0c177b2f6895fe5df
-size 9230049664
diff --git a/13B-ollama/anysecret-assistant-13B-Q8_0.gguf b/13B-ollama/anysecret-assistant-13B-Q8_0.gguf
deleted file mode 100644
index 1921ad47a2bf21bc298e9752917b2145391f58a3..0000000000000000000000000000000000000000
--- a/13B-ollama/anysecret-assistant-13B-Q8_0.gguf
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7c1c6ffab8eb447d2da08ce7cb2f70c398d9dd69ea509ae6f1f98aad33c410b6
-size 13831495424
diff --git a/adapter_config.json b/adapter_config.json
deleted file mode 100644
index 2a47c2409fcec449ecdbcdde4b38627e50b56a0b..0000000000000000000000000000000000000000
--- a/adapter_config.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
- "alpha_pattern": {},
- "auto_mapping": null,
- "base_model_name_or_path": "codellama/CodeLlama-13b-Instruct-hf",
- "bias": "none",
- "corda_config": null,
- "eva_config": null,
- "exclude_modules": null,
- "fan_in_fan_out": false,
- "inference_mode": true,
- "init_lora_weights": true,
- "layer_replication": null,
- "layers_pattern": null,
- "layers_to_transform": null,
- "loftq_config": {},
- "lora_alpha": 32,
- "lora_bias": false,
- "lora_dropout": 0.1,
- "megatron_config": null,
- "megatron_core": "megatron.core",
- "modules_to_save": null,
- "peft_type": "LORA",
- "qalora_group_size": 16,
- "r": 16,
- "rank_pattern": {},
- "revision": null,
- "target_modules": [
- "up_proj",
- "o_proj",
- "gate_proj",
- "down_proj",
- "k_proj",
- "q_proj",
- "v_proj"
- ],
- "target_parameters": null,
- "task_type": "CAUSAL_LM",
- "trainable_token_indices": null,
- "use_dora": false,
- "use_qalora": false,
- "use_rslora": false
-}
\ No newline at end of file
diff --git a/adapter_model.safetensors b/adapter_model.safetensors
deleted file mode 100644
index fe216c6a898cbd86be20675259ac5e461d2ca362..0000000000000000000000000000000000000000
--- a/adapter_model.safetensors
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:491a381f62798faedfe204bdaf00433d1efc35b1a9ec968f59030ebe507aa61a
-size 250422888
diff --git a/chat_template.jinja b/chat_template.jinja
deleted file mode 100644
index 21dba1af1b9154e9140fe0ef5ca06d011b5004c8..0000000000000000000000000000000000000000
--- a/chat_template.jinja
+++ /dev/null
@@ -1 +0,0 @@
-{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<>\n' + system_message + '\n<>\n\n' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + eos_token }}{% endif %}{% endfor %}
\ No newline at end of file
diff --git a/checkpoint-100/README.md b/checkpoint-100/README.md
deleted file mode 100644
index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000
--- a/checkpoint-100/README.md
+++ /dev/null
@@ -1,207 +0,0 @@
----
-base_model: meta-llama/Llama-3.2-3B-Instruct
-library_name: peft
-pipeline_tag: text-generation
-tags:
-- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct
-- lora
-- transformers
----
-
-# Model Card for Model ID
-
-
-
-
-
-## Model Details
-
-### Model Description
-
-
-
-
-
-- **Developed by:** [More Information Needed]
-- **Funded by [optional]:** [More Information Needed]
-- **Shared by [optional]:** [More Information Needed]
-- **Model type:** [More Information Needed]
-- **Language(s) (NLP):** [More Information Needed]
-- **License:** [More Information Needed]
-- **Finetuned from model [optional]:** [More Information Needed]
-
-### Model Sources [optional]
-
-
-
-- **Repository:** [More Information Needed]
-- **Paper [optional]:** [More Information Needed]
-- **Demo [optional]:** [More Information Needed]
-
-## Uses
-
-
-
-### Direct Use
-
-
-
-[More Information Needed]
-
-### Downstream Use [optional]
-
-
-
-[More Information Needed]
-
-### Out-of-Scope Use
-
-
-
-[More Information Needed]
-
-## Bias, Risks, and Limitations
-
-
-
-[More Information Needed]
-
-### Recommendations
-
-
-
-Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
-
-## How to Get Started with the Model
-
-Use the code below to get started with the model.
-
-[More Information Needed]
-
-## Training Details
-
-### Training Data
-
-
-
-[More Information Needed]
-
-### Training Procedure
-
-
-
-#### Preprocessing [optional]
-
-[More Information Needed]
-
-
-#### Training Hyperparameters
-
-- **Training regime:** [More Information Needed]
-
-#### Speeds, Sizes, Times [optional]
-
-
-
-[More Information Needed]
-
-## Evaluation
-
-
-
-### Testing Data, Factors & Metrics
-
-#### Testing Data
-
-
-
-[More Information Needed]
-
-#### Factors
-
-
-
-[More Information Needed]
-
-#### Metrics
-
-
-
-[More Information Needed]
-
-### Results
-
-[More Information Needed]
-
-#### Summary
-
-
-
-## Model Examination [optional]
-
-
-
-[More Information Needed]
-
-## Environmental Impact
-
-
-
-Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
-
-- **Hardware Type:** [More Information Needed]
-- **Hours used:** [More Information Needed]
-- **Cloud Provider:** [More Information Needed]
-- **Compute Region:** [More Information Needed]
-- **Carbon Emitted:** [More Information Needed]
-
-## Technical Specifications [optional]
-
-### Model Architecture and Objective
-
-[More Information Needed]
-
-### Compute Infrastructure
-
-[More Information Needed]
-
-#### Hardware
-
-[More Information Needed]
-
-#### Software
-
-[More Information Needed]
-
-## Citation [optional]
-
-
-
-**BibTeX:**
-
-[More Information Needed]
-
-**APA:**
-
-[More Information Needed]
-
-## Glossary [optional]
-
-
-
-[More Information Needed]
-
-## More Information [optional]
-
-[More Information Needed]
-
-## Model Card Authors [optional]
-
-[More Information Needed]
-
-## Model Card Contact
-
-[More Information Needed]
-### Framework versions
-
-- PEFT 0.17.1
\ No newline at end of file
diff --git a/checkpoint-100/adapter_config.json b/checkpoint-100/adapter_config.json
deleted file mode 100644
index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000
--- a/checkpoint-100/adapter_config.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
- "alpha_pattern": {},
- "auto_mapping": null,
- "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct",
- "bias": "none",
- "corda_config": null,
- "eva_config": null,
- "exclude_modules": null,
- "fan_in_fan_out": false,
- "inference_mode": true,
- "init_lora_weights": true,
- "layer_replication": null,
- "layers_pattern": null,
- "layers_to_transform": null,
- "loftq_config": {},
- "lora_alpha": 32,
- "lora_bias": false,
- "lora_dropout": 0.1,
- "megatron_config": null,
- "megatron_core": "megatron.core",
- "modules_to_save": null,
- "peft_type": "LORA",
- "qalora_group_size": 16,
- "r": 16,
- "rank_pattern": {},
- "revision": null,
- "target_modules": [
- "down_proj",
- "v_proj",
- "q_proj",
- "k_proj",
- "gate_proj",
- "o_proj",
- "up_proj"
- ],
- "target_parameters": null,
- "task_type": "CAUSAL_LM",
- "trainable_token_indices": null,
- "use_dora": false,
- "use_qalora": false,
- "use_rslora": false
-}
\ No newline at end of file
diff --git a/checkpoint-100/adapter_model.safetensors b/checkpoint-100/adapter_model.safetensors
deleted file mode 100644
index d0b49f3e9c4924545ee8d71a6a5c9740a61f4c6d..0000000000000000000000000000000000000000
--- a/checkpoint-100/adapter_model.safetensors
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:4fc6b553d80d4183d5a3cc772dccc582287021fa6ccce89b08c7e64930c0bdd5
-size 97307544
diff --git a/checkpoint-100/chat_template.jinja b/checkpoint-100/chat_template.jinja
deleted file mode 100644
index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000
--- a/checkpoint-100/chat_template.jinja
+++ /dev/null
@@ -1,93 +0,0 @@
-{{- bos_token }}
-{%- if custom_tools is defined %}
- {%- set tools = custom_tools %}
-{%- endif %}
-{%- if not tools_in_user_message is defined %}
- {%- set tools_in_user_message = true %}
-{%- endif %}
-{%- if not date_string is defined %}
- {%- if strftime_now is defined %}
- {%- set date_string = strftime_now("%d %b %Y") %}
- {%- else %}
- {%- set date_string = "26 Jul 2024" %}
- {%- endif %}
-{%- endif %}
-{%- if not tools is defined %}
- {%- set tools = none %}
-{%- endif %}
-
-{#- This block extracts the system message, so we can slot it into the right place. #}
-{%- if messages[0]['role'] == 'system' %}
- {%- set system_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
-{%- else %}
- {%- set system_message = "" %}
-{%- endif %}
-
-{#- System message #}
-{{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
-{%- if tools is not none %}
- {{- "Environment: ipython\n" }}
-{%- endif %}
-{{- "Cutting Knowledge Date: December 2023\n" }}
-{{- "Today Date: " + date_string + "\n\n" }}
-{%- if tools is not none and not tools_in_user_message %}
- {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
-{%- endif %}
-{{- system_message }}
-{{- "<|eot_id|>" }}
-
-{#- Custom tools are passed in a user message with some extra guidance #}
-{%- if tools_in_user_message and not tools is none %}
- {#- Extract the first user message so we can plug it in here #}
- {%- if messages | length != 0 %}
- {%- set first_user_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
- {%- else %}
- {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
-{%- endif %}
- {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
- {{- "Given the following functions, please respond with a JSON for a function call " }}
- {{- "with its proper arguments that best answers the given prompt.\n\n" }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
- {{- first_user_message + "<|eot_id|>"}}
-{%- endif %}
-
-{%- for message in messages %}
- {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
- {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
- {%- elif 'tool_calls' in message %}
- {%- if not message.tool_calls|length == 1 %}
- {{- raise_exception("This model only supports single tool-calls at once!") }}
- {%- endif %}
- {%- set tool_call = message.tool_calls[0].function %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
- {{- '{"name": "' + tool_call.name + '", ' }}
- {{- '"parameters": ' }}
- {{- tool_call.arguments | tojson }}
- {{- "}" }}
- {{- "<|eot_id|>" }}
- {%- elif message.role == "tool" or message.role == "ipython" %}
- {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
- {%- if message.content is mapping or message.content is iterable %}
- {{- message.content | tojson }}
- {%- else %}
- {{- message.content }}
- {%- endif %}
- {{- "<|eot_id|>" }}
- {%- endif %}
-{%- endfor %}
-{%- if add_generation_prompt %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
-{%- endif %}
diff --git a/checkpoint-100/optimizer.pt b/checkpoint-100/optimizer.pt
deleted file mode 100644
index 499bf6f0c269ddfb669b3d7e82633252d2c09e8d..0000000000000000000000000000000000000000
--- a/checkpoint-100/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f5a9c0ecb6f33b77d737e724fe719cc53e0d4cdf30efd01aaa73b310b58bf4ef
-size 194846331
diff --git a/checkpoint-100/rng_state.pth b/checkpoint-100/rng_state.pth
deleted file mode 100644
index ddf6f7dc00eefb78797f6a9017b7e05509310cbf..0000000000000000000000000000000000000000
--- a/checkpoint-100/rng_state.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:21eebf5c3ba6efdb5123bbdc37ec0bacf114ce7c5f26a6499a36b2a69fa2c90b
-size 14645
diff --git a/checkpoint-100/scaler.pt b/checkpoint-100/scaler.pt
deleted file mode 100644
index 215c5d2069bd81cb35727ebca07a510ac59c9d94..0000000000000000000000000000000000000000
--- a/checkpoint-100/scaler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c4393a84a3109995aa1202073b039b12062e3189ed89aa0b94ef0510ba843009
-size 1383
diff --git a/checkpoint-100/scheduler.pt b/checkpoint-100/scheduler.pt
deleted file mode 100644
index 02d20dbc6bab763333a8ca7033099cc160ac21c8..0000000000000000000000000000000000000000
--- a/checkpoint-100/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d244377f57e78c692ea998e9ce93a7160134e1a3af6a39359aedc2d2aa9940c5
-size 1465
diff --git a/checkpoint-100/special_tokens_map.json b/checkpoint-100/special_tokens_map.json
deleted file mode 100644
index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000
--- a/checkpoint-100/special_tokens_map.json
+++ /dev/null
@@ -1,17 +0,0 @@
-{
- "bos_token": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "eos_token": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": "<|eot_id|>"
-}
diff --git a/checkpoint-100/tokenizer.json b/checkpoint-100/tokenizer.json
deleted file mode 100644
index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000
--- a/checkpoint-100/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09
-size 17210184
diff --git a/checkpoint-100/tokenizer_config.json b/checkpoint-100/tokenizer_config.json
deleted file mode 100644
index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000
--- a/checkpoint-100/tokenizer_config.json
+++ /dev/null
@@ -1,2063 +0,0 @@
-{
- "added_tokens_decoder": {
- "128000": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128001": {
- "content": "<|end_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128002": {
- "content": "<|reserved_special_token_0|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128003": {
- "content": "<|reserved_special_token_1|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128004": {
- "content": "<|finetune_right_pad_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128005": {
- "content": "<|reserved_special_token_2|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128006": {
- "content": "<|start_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128007": {
- "content": "<|end_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128008": {
- "content": "<|eom_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128009": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128010": {
- "content": "<|python_tag|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128011": {
- "content": "<|reserved_special_token_3|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128012": {
- "content": "<|reserved_special_token_4|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128013": {
- "content": "<|reserved_special_token_5|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128014": {
- "content": "<|reserved_special_token_6|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128015": {
- "content": "<|reserved_special_token_7|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128016": {
- "content": "<|reserved_special_token_8|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128017": {
- "content": "<|reserved_special_token_9|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128018": {
- "content": "<|reserved_special_token_10|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128019": {
- "content": "<|reserved_special_token_11|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128020": {
- "content": "<|reserved_special_token_12|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128021": {
- "content": "<|reserved_special_token_13|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128022": {
- "content": "<|reserved_special_token_14|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128023": {
- "content": "<|reserved_special_token_15|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128024": {
- "content": "<|reserved_special_token_16|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128025": {
- "content": "<|reserved_special_token_17|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128026": {
- "content": "<|reserved_special_token_18|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128027": {
- "content": "<|reserved_special_token_19|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128028": {
- "content": "<|reserved_special_token_20|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128029": {
- "content": "<|reserved_special_token_21|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128030": {
- "content": "<|reserved_special_token_22|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128031": {
- "content": "<|reserved_special_token_23|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128032": {
- "content": "<|reserved_special_token_24|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128033": {
- "content": "<|reserved_special_token_25|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128034": {
- "content": "<|reserved_special_token_26|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128035": {
- "content": "<|reserved_special_token_27|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128036": {
- "content": "<|reserved_special_token_28|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128037": {
- "content": "<|reserved_special_token_29|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128038": {
- "content": "<|reserved_special_token_30|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128039": {
- "content": "<|reserved_special_token_31|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128040": {
- "content": "<|reserved_special_token_32|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128041": {
- "content": "<|reserved_special_token_33|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128042": {
- "content": "<|reserved_special_token_34|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128043": {
- "content": "<|reserved_special_token_35|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128044": {
- "content": "<|reserved_special_token_36|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128045": {
- "content": "<|reserved_special_token_37|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128046": {
- "content": "<|reserved_special_token_38|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128047": {
- "content": "<|reserved_special_token_39|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128048": {
- "content": "<|reserved_special_token_40|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128049": {
- "content": "<|reserved_special_token_41|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128050": {
- "content": "<|reserved_special_token_42|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128051": {
- "content": "<|reserved_special_token_43|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128052": {
- "content": "<|reserved_special_token_44|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128053": {
- "content": "<|reserved_special_token_45|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128054": {
- "content": "<|reserved_special_token_46|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128055": {
- "content": "<|reserved_special_token_47|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128056": {
- "content": "<|reserved_special_token_48|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128057": {
- "content": "<|reserved_special_token_49|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128058": {
- "content": "<|reserved_special_token_50|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128059": {
- "content": "<|reserved_special_token_51|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128060": {
- "content": "<|reserved_special_token_52|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128061": {
- "content": "<|reserved_special_token_53|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128062": {
- "content": "<|reserved_special_token_54|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128063": {
- "content": "<|reserved_special_token_55|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128064": {
- "content": "<|reserved_special_token_56|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128065": {
- "content": "<|reserved_special_token_57|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128066": {
- "content": "<|reserved_special_token_58|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128067": {
- "content": "<|reserved_special_token_59|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128068": {
- "content": "<|reserved_special_token_60|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128069": {
- "content": "<|reserved_special_token_61|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128070": {
- "content": "<|reserved_special_token_62|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128071": {
- "content": "<|reserved_special_token_63|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128072": {
- "content": "<|reserved_special_token_64|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128073": {
- "content": "<|reserved_special_token_65|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128074": {
- "content": "<|reserved_special_token_66|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128075": {
- "content": "<|reserved_special_token_67|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128076": {
- "content": "<|reserved_special_token_68|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128077": {
- "content": "<|reserved_special_token_69|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128078": {
- "content": "<|reserved_special_token_70|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128079": {
- "content": "<|reserved_special_token_71|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128080": {
- "content": "<|reserved_special_token_72|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128081": {
- "content": "<|reserved_special_token_73|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128082": {
- "content": "<|reserved_special_token_74|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128083": {
- "content": "<|reserved_special_token_75|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128084": {
- "content": "<|reserved_special_token_76|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128085": {
- "content": "<|reserved_special_token_77|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128086": {
- "content": "<|reserved_special_token_78|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128087": {
- "content": "<|reserved_special_token_79|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128088": {
- "content": "<|reserved_special_token_80|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128089": {
- "content": "<|reserved_special_token_81|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128090": {
- "content": "<|reserved_special_token_82|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128091": {
- "content": "<|reserved_special_token_83|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128092": {
- "content": "<|reserved_special_token_84|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128093": {
- "content": "<|reserved_special_token_85|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128094": {
- "content": "<|reserved_special_token_86|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128095": {
- "content": "<|reserved_special_token_87|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128096": {
- "content": "<|reserved_special_token_88|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128097": {
- "content": "<|reserved_special_token_89|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128098": {
- "content": "<|reserved_special_token_90|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128099": {
- "content": "<|reserved_special_token_91|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128100": {
- "content": "<|reserved_special_token_92|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128101": {
- "content": "<|reserved_special_token_93|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128102": {
- "content": "<|reserved_special_token_94|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128103": {
- "content": "<|reserved_special_token_95|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128104": {
- "content": "<|reserved_special_token_96|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128105": {
- "content": "<|reserved_special_token_97|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128106": {
- "content": "<|reserved_special_token_98|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128107": {
- "content": "<|reserved_special_token_99|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128108": {
- "content": "<|reserved_special_token_100|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128109": {
- "content": "<|reserved_special_token_101|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128110": {
- "content": "<|reserved_special_token_102|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128111": {
- "content": "<|reserved_special_token_103|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128112": {
- "content": "<|reserved_special_token_104|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128113": {
- "content": "<|reserved_special_token_105|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128114": {
- "content": "<|reserved_special_token_106|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128115": {
- "content": "<|reserved_special_token_107|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128116": {
- "content": "<|reserved_special_token_108|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128117": {
- "content": "<|reserved_special_token_109|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128118": {
- "content": "<|reserved_special_token_110|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128119": {
- "content": "<|reserved_special_token_111|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128120": {
- "content": "<|reserved_special_token_112|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128121": {
- "content": "<|reserved_special_token_113|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128122": {
- "content": "<|reserved_special_token_114|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128123": {
- "content": "<|reserved_special_token_115|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128124": {
- "content": "<|reserved_special_token_116|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128125": {
- "content": "<|reserved_special_token_117|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128126": {
- "content": "<|reserved_special_token_118|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128127": {
- "content": "<|reserved_special_token_119|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128128": {
- "content": "<|reserved_special_token_120|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128129": {
- "content": "<|reserved_special_token_121|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128130": {
- "content": "<|reserved_special_token_122|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128131": {
- "content": "<|reserved_special_token_123|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128132": {
- "content": "<|reserved_special_token_124|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128133": {
- "content": "<|reserved_special_token_125|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128134": {
- "content": "<|reserved_special_token_126|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128135": {
- "content": "<|reserved_special_token_127|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128136": {
- "content": "<|reserved_special_token_128|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128137": {
- "content": "<|reserved_special_token_129|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128138": {
- "content": "<|reserved_special_token_130|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128139": {
- "content": "<|reserved_special_token_131|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128140": {
- "content": "<|reserved_special_token_132|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128141": {
- "content": "<|reserved_special_token_133|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128142": {
- "content": "<|reserved_special_token_134|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128143": {
- "content": "<|reserved_special_token_135|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128144": {
- "content": "<|reserved_special_token_136|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128145": {
- "content": "<|reserved_special_token_137|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128146": {
- "content": "<|reserved_special_token_138|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128147": {
- "content": "<|reserved_special_token_139|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128148": {
- "content": "<|reserved_special_token_140|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128149": {
- "content": "<|reserved_special_token_141|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128150": {
- "content": "<|reserved_special_token_142|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128151": {
- "content": "<|reserved_special_token_143|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128152": {
- "content": "<|reserved_special_token_144|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128153": {
- "content": "<|reserved_special_token_145|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128154": {
- "content": "<|reserved_special_token_146|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128155": {
- "content": "<|reserved_special_token_147|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128156": {
- "content": "<|reserved_special_token_148|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128157": {
- "content": "<|reserved_special_token_149|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128158": {
- "content": "<|reserved_special_token_150|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128159": {
- "content": "<|reserved_special_token_151|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128160": {
- "content": "<|reserved_special_token_152|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128161": {
- "content": "<|reserved_special_token_153|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128162": {
- "content": "<|reserved_special_token_154|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128163": {
- "content": "<|reserved_special_token_155|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128164": {
- "content": "<|reserved_special_token_156|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128165": {
- "content": "<|reserved_special_token_157|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128166": {
- "content": "<|reserved_special_token_158|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128167": {
- "content": "<|reserved_special_token_159|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128168": {
- "content": "<|reserved_special_token_160|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128169": {
- "content": "<|reserved_special_token_161|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128170": {
- "content": "<|reserved_special_token_162|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128171": {
- "content": "<|reserved_special_token_163|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128172": {
- "content": "<|reserved_special_token_164|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128173": {
- "content": "<|reserved_special_token_165|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128174": {
- "content": "<|reserved_special_token_166|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128175": {
- "content": "<|reserved_special_token_167|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128176": {
- "content": "<|reserved_special_token_168|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128177": {
- "content": "<|reserved_special_token_169|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128178": {
- "content": "<|reserved_special_token_170|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128179": {
- "content": "<|reserved_special_token_171|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128180": {
- "content": "<|reserved_special_token_172|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128181": {
- "content": "<|reserved_special_token_173|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128182": {
- "content": "<|reserved_special_token_174|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128183": {
- "content": "<|reserved_special_token_175|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128184": {
- "content": "<|reserved_special_token_176|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128185": {
- "content": "<|reserved_special_token_177|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128186": {
- "content": "<|reserved_special_token_178|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128187": {
- "content": "<|reserved_special_token_179|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128188": {
- "content": "<|reserved_special_token_180|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128189": {
- "content": "<|reserved_special_token_181|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128190": {
- "content": "<|reserved_special_token_182|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128191": {
- "content": "<|reserved_special_token_183|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128192": {
- "content": "<|reserved_special_token_184|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128193": {
- "content": "<|reserved_special_token_185|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128194": {
- "content": "<|reserved_special_token_186|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128195": {
- "content": "<|reserved_special_token_187|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128196": {
- "content": "<|reserved_special_token_188|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128197": {
- "content": "<|reserved_special_token_189|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128198": {
- "content": "<|reserved_special_token_190|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128199": {
- "content": "<|reserved_special_token_191|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128200": {
- "content": "<|reserved_special_token_192|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128201": {
- "content": "<|reserved_special_token_193|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128202": {
- "content": "<|reserved_special_token_194|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128203": {
- "content": "<|reserved_special_token_195|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128204": {
- "content": "<|reserved_special_token_196|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128205": {
- "content": "<|reserved_special_token_197|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128206": {
- "content": "<|reserved_special_token_198|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128207": {
- "content": "<|reserved_special_token_199|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128208": {
- "content": "<|reserved_special_token_200|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128209": {
- "content": "<|reserved_special_token_201|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128210": {
- "content": "<|reserved_special_token_202|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128211": {
- "content": "<|reserved_special_token_203|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128212": {
- "content": "<|reserved_special_token_204|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128213": {
- "content": "<|reserved_special_token_205|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128214": {
- "content": "<|reserved_special_token_206|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128215": {
- "content": "<|reserved_special_token_207|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128216": {
- "content": "<|reserved_special_token_208|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128217": {
- "content": "<|reserved_special_token_209|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128218": {
- "content": "<|reserved_special_token_210|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128219": {
- "content": "<|reserved_special_token_211|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128220": {
- "content": "<|reserved_special_token_212|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128221": {
- "content": "<|reserved_special_token_213|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128222": {
- "content": "<|reserved_special_token_214|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128223": {
- "content": "<|reserved_special_token_215|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128224": {
- "content": "<|reserved_special_token_216|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128225": {
- "content": "<|reserved_special_token_217|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128226": {
- "content": "<|reserved_special_token_218|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128227": {
- "content": "<|reserved_special_token_219|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128228": {
- "content": "<|reserved_special_token_220|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128229": {
- "content": "<|reserved_special_token_221|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128230": {
- "content": "<|reserved_special_token_222|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128231": {
- "content": "<|reserved_special_token_223|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128232": {
- "content": "<|reserved_special_token_224|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128233": {
- "content": "<|reserved_special_token_225|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128234": {
- "content": "<|reserved_special_token_226|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128235": {
- "content": "<|reserved_special_token_227|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128236": {
- "content": "<|reserved_special_token_228|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128237": {
- "content": "<|reserved_special_token_229|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128238": {
- "content": "<|reserved_special_token_230|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128239": {
- "content": "<|reserved_special_token_231|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128240": {
- "content": "<|reserved_special_token_232|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128241": {
- "content": "<|reserved_special_token_233|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128242": {
- "content": "<|reserved_special_token_234|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128243": {
- "content": "<|reserved_special_token_235|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128244": {
- "content": "<|reserved_special_token_236|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128245": {
- "content": "<|reserved_special_token_237|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128246": {
- "content": "<|reserved_special_token_238|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128247": {
- "content": "<|reserved_special_token_239|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128248": {
- "content": "<|reserved_special_token_240|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128249": {
- "content": "<|reserved_special_token_241|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128250": {
- "content": "<|reserved_special_token_242|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128251": {
- "content": "<|reserved_special_token_243|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128252": {
- "content": "<|reserved_special_token_244|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128253": {
- "content": "<|reserved_special_token_245|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128254": {
- "content": "<|reserved_special_token_246|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128255": {
- "content": "<|reserved_special_token_247|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- }
- },
- "bos_token": "<|begin_of_text|>",
- "clean_up_tokenization_spaces": true,
- "eos_token": "<|eot_id|>",
- "extra_special_tokens": {},
- "model_input_names": [
- "input_ids",
- "attention_mask"
- ],
- "model_max_length": 131072,
- "pad_token": "<|eot_id|>",
- "tokenizer_class": "PreTrainedTokenizerFast"
-}
diff --git a/checkpoint-100/trainer_state.json b/checkpoint-100/trainer_state.json
deleted file mode 100644
index b85b9bb52bc4fe431a14b79564908be103d2ae3e..0000000000000000000000000000000000000000
--- a/checkpoint-100/trainer_state.json
+++ /dev/null
@@ -1,120 +0,0 @@
-{
- "best_global_step": 50,
- "best_metric": 0.7558398842811584,
- "best_model_checkpoint": null,
- "epoch": 10.0,
- "eval_steps": 50,
- "global_step": 100,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 1.0,
- "grad_norm": 1.4660576581954956,
- "learning_rate": 3.6e-05,
- "loss": 1.152,
- "step": 10
- },
- {
- "epoch": 2.0,
- "grad_norm": 0.8749533295631409,
- "learning_rate": 7.6e-05,
- "loss": 1.0421,
- "step": 20
- },
- {
- "epoch": 3.0,
- "grad_norm": 3.37060284614563,
- "learning_rate": 0.000116,
- "loss": 0.8539,
- "step": 30
- },
- {
- "epoch": 4.0,
- "grad_norm": 1.5355278253555298,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.5483,
- "step": 40
- },
- {
- "epoch": 5.0,
- "grad_norm": 2.454838514328003,
- "learning_rate": 0.000196,
- "loss": 0.3736,
- "step": 50
- },
- {
- "epoch": 5.0,
- "eval_loss": 0.7558398842811584,
- "eval_runtime": 1.7227,
- "eval_samples_per_second": 2.902,
- "eval_steps_per_second": 2.902,
- "step": 50
- },
- {
- "epoch": 6.0,
- "grad_norm": 3.676417827606201,
- "learning_rate": 0.000196,
- "loss": 0.2291,
- "step": 60
- },
- {
- "epoch": 7.0,
- "grad_norm": 2.192375898361206,
- "learning_rate": 0.00019155555555555554,
- "loss": 0.1244,
- "step": 70
- },
- {
- "epoch": 8.0,
- "grad_norm": 2.630005359649658,
- "learning_rate": 0.00018711111111111112,
- "loss": 0.0862,
- "step": 80
- },
- {
- "epoch": 9.0,
- "grad_norm": 0.5021786093711853,
- "learning_rate": 0.00018266666666666667,
- "loss": 0.0614,
- "step": 90
- },
- {
- "epoch": 10.0,
- "grad_norm": 0.38170942664146423,
- "learning_rate": 0.00017822222222222222,
- "loss": 0.0471,
- "step": 100
- },
- {
- "epoch": 10.0,
- "eval_loss": 0.8806974291801453,
- "eval_runtime": 1.7764,
- "eval_samples_per_second": 2.815,
- "eval_steps_per_second": 2.815,
- "step": 100
- }
- ],
- "logging_steps": 10,
- "max_steps": 500,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 50,
- "save_steps": 100,
- "stateful_callbacks": {
- "TrainerControl": {
- "args": {
- "should_epoch_stop": false,
- "should_evaluate": false,
- "should_log": false,
- "should_save": true,
- "should_training_stop": false
- },
- "attributes": {}
- }
- },
- "total_flos": 1.327550391386112e+16,
- "train_batch_size": 1,
- "trial_name": null,
- "trial_params": null
-}
diff --git a/checkpoint-100/training_args.bin b/checkpoint-100/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/checkpoint-100/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777
diff --git a/checkpoint-200/README.md b/checkpoint-200/README.md
deleted file mode 100644
index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000
--- a/checkpoint-200/README.md
+++ /dev/null
@@ -1,207 +0,0 @@
----
-base_model: meta-llama/Llama-3.2-3B-Instruct
-library_name: peft
-pipeline_tag: text-generation
-tags:
-- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct
-- lora
-- transformers
----
-
-# Model Card for Model ID
-
-
-
-
-
-## Model Details
-
-### Model Description
-
-
-
-
-
-- **Developed by:** [More Information Needed]
-- **Funded by [optional]:** [More Information Needed]
-- **Shared by [optional]:** [More Information Needed]
-- **Model type:** [More Information Needed]
-- **Language(s) (NLP):** [More Information Needed]
-- **License:** [More Information Needed]
-- **Finetuned from model [optional]:** [More Information Needed]
-
-### Model Sources [optional]
-
-
-
-- **Repository:** [More Information Needed]
-- **Paper [optional]:** [More Information Needed]
-- **Demo [optional]:** [More Information Needed]
-
-## Uses
-
-
-
-### Direct Use
-
-
-
-[More Information Needed]
-
-### Downstream Use [optional]
-
-
-
-[More Information Needed]
-
-### Out-of-Scope Use
-
-
-
-[More Information Needed]
-
-## Bias, Risks, and Limitations
-
-
-
-[More Information Needed]
-
-### Recommendations
-
-
-
-Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
-
-## How to Get Started with the Model
-
-Use the code below to get started with the model.
-
-[More Information Needed]
-
-## Training Details
-
-### Training Data
-
-
-
-[More Information Needed]
-
-### Training Procedure
-
-
-
-#### Preprocessing [optional]
-
-[More Information Needed]
-
-
-#### Training Hyperparameters
-
-- **Training regime:** [More Information Needed]
-
-#### Speeds, Sizes, Times [optional]
-
-
-
-[More Information Needed]
-
-## Evaluation
-
-
-
-### Testing Data, Factors & Metrics
-
-#### Testing Data
-
-
-
-[More Information Needed]
-
-#### Factors
-
-
-
-[More Information Needed]
-
-#### Metrics
-
-
-
-[More Information Needed]
-
-### Results
-
-[More Information Needed]
-
-#### Summary
-
-
-
-## Model Examination [optional]
-
-
-
-[More Information Needed]
-
-## Environmental Impact
-
-
-
-Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
-
-- **Hardware Type:** [More Information Needed]
-- **Hours used:** [More Information Needed]
-- **Cloud Provider:** [More Information Needed]
-- **Compute Region:** [More Information Needed]
-- **Carbon Emitted:** [More Information Needed]
-
-## Technical Specifications [optional]
-
-### Model Architecture and Objective
-
-[More Information Needed]
-
-### Compute Infrastructure
-
-[More Information Needed]
-
-#### Hardware
-
-[More Information Needed]
-
-#### Software
-
-[More Information Needed]
-
-## Citation [optional]
-
-
-
-**BibTeX:**
-
-[More Information Needed]
-
-**APA:**
-
-[More Information Needed]
-
-## Glossary [optional]
-
-
-
-[More Information Needed]
-
-## More Information [optional]
-
-[More Information Needed]
-
-## Model Card Authors [optional]
-
-[More Information Needed]
-
-## Model Card Contact
-
-[More Information Needed]
-### Framework versions
-
-- PEFT 0.17.1
\ No newline at end of file
diff --git a/checkpoint-200/adapter_config.json b/checkpoint-200/adapter_config.json
deleted file mode 100644
index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000
--- a/checkpoint-200/adapter_config.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
- "alpha_pattern": {},
- "auto_mapping": null,
- "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct",
- "bias": "none",
- "corda_config": null,
- "eva_config": null,
- "exclude_modules": null,
- "fan_in_fan_out": false,
- "inference_mode": true,
- "init_lora_weights": true,
- "layer_replication": null,
- "layers_pattern": null,
- "layers_to_transform": null,
- "loftq_config": {},
- "lora_alpha": 32,
- "lora_bias": false,
- "lora_dropout": 0.1,
- "megatron_config": null,
- "megatron_core": "megatron.core",
- "modules_to_save": null,
- "peft_type": "LORA",
- "qalora_group_size": 16,
- "r": 16,
- "rank_pattern": {},
- "revision": null,
- "target_modules": [
- "down_proj",
- "v_proj",
- "q_proj",
- "k_proj",
- "gate_proj",
- "o_proj",
- "up_proj"
- ],
- "target_parameters": null,
- "task_type": "CAUSAL_LM",
- "trainable_token_indices": null,
- "use_dora": false,
- "use_qalora": false,
- "use_rslora": false
-}
\ No newline at end of file
diff --git a/checkpoint-200/adapter_model.safetensors b/checkpoint-200/adapter_model.safetensors
deleted file mode 100644
index 2b3fa85b7a0b2b881f5ad32e10c70d80a5846133..0000000000000000000000000000000000000000
--- a/checkpoint-200/adapter_model.safetensors
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:10f314568bf765a9d52faf4b26b09d687304a1e227e75be06f046a06de38812a
-size 97307544
diff --git a/checkpoint-200/chat_template.jinja b/checkpoint-200/chat_template.jinja
deleted file mode 100644
index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000
--- a/checkpoint-200/chat_template.jinja
+++ /dev/null
@@ -1,93 +0,0 @@
-{{- bos_token }}
-{%- if custom_tools is defined %}
- {%- set tools = custom_tools %}
-{%- endif %}
-{%- if not tools_in_user_message is defined %}
- {%- set tools_in_user_message = true %}
-{%- endif %}
-{%- if not date_string is defined %}
- {%- if strftime_now is defined %}
- {%- set date_string = strftime_now("%d %b %Y") %}
- {%- else %}
- {%- set date_string = "26 Jul 2024" %}
- {%- endif %}
-{%- endif %}
-{%- if not tools is defined %}
- {%- set tools = none %}
-{%- endif %}
-
-{#- This block extracts the system message, so we can slot it into the right place. #}
-{%- if messages[0]['role'] == 'system' %}
- {%- set system_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
-{%- else %}
- {%- set system_message = "" %}
-{%- endif %}
-
-{#- System message #}
-{{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
-{%- if tools is not none %}
- {{- "Environment: ipython\n" }}
-{%- endif %}
-{{- "Cutting Knowledge Date: December 2023\n" }}
-{{- "Today Date: " + date_string + "\n\n" }}
-{%- if tools is not none and not tools_in_user_message %}
- {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
-{%- endif %}
-{{- system_message }}
-{{- "<|eot_id|>" }}
-
-{#- Custom tools are passed in a user message with some extra guidance #}
-{%- if tools_in_user_message and not tools is none %}
- {#- Extract the first user message so we can plug it in here #}
- {%- if messages | length != 0 %}
- {%- set first_user_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
- {%- else %}
- {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
-{%- endif %}
- {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
- {{- "Given the following functions, please respond with a JSON for a function call " }}
- {{- "with its proper arguments that best answers the given prompt.\n\n" }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
- {{- first_user_message + "<|eot_id|>"}}
-{%- endif %}
-
-{%- for message in messages %}
- {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
- {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
- {%- elif 'tool_calls' in message %}
- {%- if not message.tool_calls|length == 1 %}
- {{- raise_exception("This model only supports single tool-calls at once!") }}
- {%- endif %}
- {%- set tool_call = message.tool_calls[0].function %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
- {{- '{"name": "' + tool_call.name + '", ' }}
- {{- '"parameters": ' }}
- {{- tool_call.arguments | tojson }}
- {{- "}" }}
- {{- "<|eot_id|>" }}
- {%- elif message.role == "tool" or message.role == "ipython" %}
- {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
- {%- if message.content is mapping or message.content is iterable %}
- {{- message.content | tojson }}
- {%- else %}
- {{- message.content }}
- {%- endif %}
- {{- "<|eot_id|>" }}
- {%- endif %}
-{%- endfor %}
-{%- if add_generation_prompt %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
-{%- endif %}
diff --git a/checkpoint-200/optimizer.pt b/checkpoint-200/optimizer.pt
deleted file mode 100644
index f3b02add2d4ca6a44295d48814dd6b7f776e823b..0000000000000000000000000000000000000000
--- a/checkpoint-200/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b6e4054c31ada60cdc2d5abc92ee7ae6a394f2aee4f62444f6182af065065469
-size 194846331
diff --git a/checkpoint-200/rng_state.pth b/checkpoint-200/rng_state.pth
deleted file mode 100644
index f90d2ea69ed0322133c0a511dcd98aef2e801910..0000000000000000000000000000000000000000
--- a/checkpoint-200/rng_state.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:5d4b19975224e425acc366825a1e7970a459487fa7a57ffeb1a94ad4de25fa1d
-size 14645
diff --git a/checkpoint-200/scaler.pt b/checkpoint-200/scaler.pt
deleted file mode 100644
index dce3572b315210d751b935f42f897c650110e0c7..0000000000000000000000000000000000000000
--- a/checkpoint-200/scaler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:124625e167eb28acbfc793cfcb3e8a08b32e7fea06501462bc9e420a5e1beb2a
-size 1383
diff --git a/checkpoint-200/scheduler.pt b/checkpoint-200/scheduler.pt
deleted file mode 100644
index 6293f8e8c13cfc93b4ba1fb58087d97a20041222..0000000000000000000000000000000000000000
--- a/checkpoint-200/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:37315ef08bfa8057ff315cea8e5349272ef9591e350519ec1b303f17a237220b
-size 1465
diff --git a/checkpoint-200/special_tokens_map.json b/checkpoint-200/special_tokens_map.json
deleted file mode 100644
index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000
--- a/checkpoint-200/special_tokens_map.json
+++ /dev/null
@@ -1,17 +0,0 @@
-{
- "bos_token": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "eos_token": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": "<|eot_id|>"
-}
diff --git a/checkpoint-200/tokenizer.json b/checkpoint-200/tokenizer.json
deleted file mode 100644
index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000
--- a/checkpoint-200/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09
-size 17210184
diff --git a/checkpoint-200/tokenizer_config.json b/checkpoint-200/tokenizer_config.json
deleted file mode 100644
index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000
--- a/checkpoint-200/tokenizer_config.json
+++ /dev/null
@@ -1,2063 +0,0 @@
-{
- "added_tokens_decoder": {
- "128000": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128001": {
- "content": "<|end_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128002": {
- "content": "<|reserved_special_token_0|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128003": {
- "content": "<|reserved_special_token_1|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128004": {
- "content": "<|finetune_right_pad_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128005": {
- "content": "<|reserved_special_token_2|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128006": {
- "content": "<|start_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128007": {
- "content": "<|end_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128008": {
- "content": "<|eom_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128009": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128010": {
- "content": "<|python_tag|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128011": {
- "content": "<|reserved_special_token_3|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128012": {
- "content": "<|reserved_special_token_4|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128013": {
- "content": "<|reserved_special_token_5|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128014": {
- "content": "<|reserved_special_token_6|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128015": {
- "content": "<|reserved_special_token_7|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128016": {
- "content": "<|reserved_special_token_8|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128017": {
- "content": "<|reserved_special_token_9|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128018": {
- "content": "<|reserved_special_token_10|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128019": {
- "content": "<|reserved_special_token_11|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128020": {
- "content": "<|reserved_special_token_12|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128021": {
- "content": "<|reserved_special_token_13|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128022": {
- "content": "<|reserved_special_token_14|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128023": {
- "content": "<|reserved_special_token_15|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128024": {
- "content": "<|reserved_special_token_16|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128025": {
- "content": "<|reserved_special_token_17|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128026": {
- "content": "<|reserved_special_token_18|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128027": {
- "content": "<|reserved_special_token_19|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128028": {
- "content": "<|reserved_special_token_20|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128029": {
- "content": "<|reserved_special_token_21|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128030": {
- "content": "<|reserved_special_token_22|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128031": {
- "content": "<|reserved_special_token_23|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128032": {
- "content": "<|reserved_special_token_24|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128033": {
- "content": "<|reserved_special_token_25|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128034": {
- "content": "<|reserved_special_token_26|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128035": {
- "content": "<|reserved_special_token_27|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128036": {
- "content": "<|reserved_special_token_28|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128037": {
- "content": "<|reserved_special_token_29|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128038": {
- "content": "<|reserved_special_token_30|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128039": {
- "content": "<|reserved_special_token_31|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128040": {
- "content": "<|reserved_special_token_32|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128041": {
- "content": "<|reserved_special_token_33|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128042": {
- "content": "<|reserved_special_token_34|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128043": {
- "content": "<|reserved_special_token_35|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128044": {
- "content": "<|reserved_special_token_36|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128045": {
- "content": "<|reserved_special_token_37|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128046": {
- "content": "<|reserved_special_token_38|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128047": {
- "content": "<|reserved_special_token_39|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128048": {
- "content": "<|reserved_special_token_40|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128049": {
- "content": "<|reserved_special_token_41|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128050": {
- "content": "<|reserved_special_token_42|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128051": {
- "content": "<|reserved_special_token_43|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128052": {
- "content": "<|reserved_special_token_44|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128053": {
- "content": "<|reserved_special_token_45|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128054": {
- "content": "<|reserved_special_token_46|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128055": {
- "content": "<|reserved_special_token_47|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128056": {
- "content": "<|reserved_special_token_48|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128057": {
- "content": "<|reserved_special_token_49|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128058": {
- "content": "<|reserved_special_token_50|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128059": {
- "content": "<|reserved_special_token_51|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128060": {
- "content": "<|reserved_special_token_52|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128061": {
- "content": "<|reserved_special_token_53|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128062": {
- "content": "<|reserved_special_token_54|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128063": {
- "content": "<|reserved_special_token_55|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128064": {
- "content": "<|reserved_special_token_56|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128065": {
- "content": "<|reserved_special_token_57|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128066": {
- "content": "<|reserved_special_token_58|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128067": {
- "content": "<|reserved_special_token_59|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128068": {
- "content": "<|reserved_special_token_60|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128069": {
- "content": "<|reserved_special_token_61|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128070": {
- "content": "<|reserved_special_token_62|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128071": {
- "content": "<|reserved_special_token_63|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128072": {
- "content": "<|reserved_special_token_64|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128073": {
- "content": "<|reserved_special_token_65|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128074": {
- "content": "<|reserved_special_token_66|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128075": {
- "content": "<|reserved_special_token_67|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128076": {
- "content": "<|reserved_special_token_68|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128077": {
- "content": "<|reserved_special_token_69|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128078": {
- "content": "<|reserved_special_token_70|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128079": {
- "content": "<|reserved_special_token_71|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128080": {
- "content": "<|reserved_special_token_72|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128081": {
- "content": "<|reserved_special_token_73|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128082": {
- "content": "<|reserved_special_token_74|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128083": {
- "content": "<|reserved_special_token_75|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128084": {
- "content": "<|reserved_special_token_76|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128085": {
- "content": "<|reserved_special_token_77|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128086": {
- "content": "<|reserved_special_token_78|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128087": {
- "content": "<|reserved_special_token_79|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128088": {
- "content": "<|reserved_special_token_80|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128089": {
- "content": "<|reserved_special_token_81|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128090": {
- "content": "<|reserved_special_token_82|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128091": {
- "content": "<|reserved_special_token_83|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128092": {
- "content": "<|reserved_special_token_84|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128093": {
- "content": "<|reserved_special_token_85|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128094": {
- "content": "<|reserved_special_token_86|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128095": {
- "content": "<|reserved_special_token_87|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128096": {
- "content": "<|reserved_special_token_88|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128097": {
- "content": "<|reserved_special_token_89|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128098": {
- "content": "<|reserved_special_token_90|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128099": {
- "content": "<|reserved_special_token_91|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128100": {
- "content": "<|reserved_special_token_92|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128101": {
- "content": "<|reserved_special_token_93|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128102": {
- "content": "<|reserved_special_token_94|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128103": {
- "content": "<|reserved_special_token_95|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128104": {
- "content": "<|reserved_special_token_96|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128105": {
- "content": "<|reserved_special_token_97|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128106": {
- "content": "<|reserved_special_token_98|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128107": {
- "content": "<|reserved_special_token_99|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128108": {
- "content": "<|reserved_special_token_100|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128109": {
- "content": "<|reserved_special_token_101|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128110": {
- "content": "<|reserved_special_token_102|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128111": {
- "content": "<|reserved_special_token_103|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128112": {
- "content": "<|reserved_special_token_104|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128113": {
- "content": "<|reserved_special_token_105|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128114": {
- "content": "<|reserved_special_token_106|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128115": {
- "content": "<|reserved_special_token_107|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128116": {
- "content": "<|reserved_special_token_108|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128117": {
- "content": "<|reserved_special_token_109|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128118": {
- "content": "<|reserved_special_token_110|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128119": {
- "content": "<|reserved_special_token_111|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128120": {
- "content": "<|reserved_special_token_112|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128121": {
- "content": "<|reserved_special_token_113|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128122": {
- "content": "<|reserved_special_token_114|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128123": {
- "content": "<|reserved_special_token_115|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128124": {
- "content": "<|reserved_special_token_116|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128125": {
- "content": "<|reserved_special_token_117|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128126": {
- "content": "<|reserved_special_token_118|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128127": {
- "content": "<|reserved_special_token_119|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128128": {
- "content": "<|reserved_special_token_120|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128129": {
- "content": "<|reserved_special_token_121|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128130": {
- "content": "<|reserved_special_token_122|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128131": {
- "content": "<|reserved_special_token_123|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128132": {
- "content": "<|reserved_special_token_124|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128133": {
- "content": "<|reserved_special_token_125|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128134": {
- "content": "<|reserved_special_token_126|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128135": {
- "content": "<|reserved_special_token_127|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128136": {
- "content": "<|reserved_special_token_128|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128137": {
- "content": "<|reserved_special_token_129|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128138": {
- "content": "<|reserved_special_token_130|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128139": {
- "content": "<|reserved_special_token_131|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128140": {
- "content": "<|reserved_special_token_132|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128141": {
- "content": "<|reserved_special_token_133|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128142": {
- "content": "<|reserved_special_token_134|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128143": {
- "content": "<|reserved_special_token_135|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128144": {
- "content": "<|reserved_special_token_136|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128145": {
- "content": "<|reserved_special_token_137|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128146": {
- "content": "<|reserved_special_token_138|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128147": {
- "content": "<|reserved_special_token_139|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128148": {
- "content": "<|reserved_special_token_140|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128149": {
- "content": "<|reserved_special_token_141|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128150": {
- "content": "<|reserved_special_token_142|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128151": {
- "content": "<|reserved_special_token_143|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128152": {
- "content": "<|reserved_special_token_144|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128153": {
- "content": "<|reserved_special_token_145|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128154": {
- "content": "<|reserved_special_token_146|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128155": {
- "content": "<|reserved_special_token_147|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128156": {
- "content": "<|reserved_special_token_148|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128157": {
- "content": "<|reserved_special_token_149|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128158": {
- "content": "<|reserved_special_token_150|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128159": {
- "content": "<|reserved_special_token_151|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128160": {
- "content": "<|reserved_special_token_152|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128161": {
- "content": "<|reserved_special_token_153|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128162": {
- "content": "<|reserved_special_token_154|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128163": {
- "content": "<|reserved_special_token_155|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128164": {
- "content": "<|reserved_special_token_156|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128165": {
- "content": "<|reserved_special_token_157|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128166": {
- "content": "<|reserved_special_token_158|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128167": {
- "content": "<|reserved_special_token_159|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128168": {
- "content": "<|reserved_special_token_160|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128169": {
- "content": "<|reserved_special_token_161|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128170": {
- "content": "<|reserved_special_token_162|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128171": {
- "content": "<|reserved_special_token_163|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128172": {
- "content": "<|reserved_special_token_164|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128173": {
- "content": "<|reserved_special_token_165|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128174": {
- "content": "<|reserved_special_token_166|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128175": {
- "content": "<|reserved_special_token_167|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128176": {
- "content": "<|reserved_special_token_168|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128177": {
- "content": "<|reserved_special_token_169|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128178": {
- "content": "<|reserved_special_token_170|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128179": {
- "content": "<|reserved_special_token_171|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128180": {
- "content": "<|reserved_special_token_172|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128181": {
- "content": "<|reserved_special_token_173|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128182": {
- "content": "<|reserved_special_token_174|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128183": {
- "content": "<|reserved_special_token_175|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128184": {
- "content": "<|reserved_special_token_176|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128185": {
- "content": "<|reserved_special_token_177|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128186": {
- "content": "<|reserved_special_token_178|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128187": {
- "content": "<|reserved_special_token_179|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128188": {
- "content": "<|reserved_special_token_180|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128189": {
- "content": "<|reserved_special_token_181|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128190": {
- "content": "<|reserved_special_token_182|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128191": {
- "content": "<|reserved_special_token_183|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128192": {
- "content": "<|reserved_special_token_184|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128193": {
- "content": "<|reserved_special_token_185|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128194": {
- "content": "<|reserved_special_token_186|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128195": {
- "content": "<|reserved_special_token_187|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128196": {
- "content": "<|reserved_special_token_188|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128197": {
- "content": "<|reserved_special_token_189|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128198": {
- "content": "<|reserved_special_token_190|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128199": {
- "content": "<|reserved_special_token_191|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128200": {
- "content": "<|reserved_special_token_192|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128201": {
- "content": "<|reserved_special_token_193|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128202": {
- "content": "<|reserved_special_token_194|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128203": {
- "content": "<|reserved_special_token_195|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128204": {
- "content": "<|reserved_special_token_196|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128205": {
- "content": "<|reserved_special_token_197|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128206": {
- "content": "<|reserved_special_token_198|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128207": {
- "content": "<|reserved_special_token_199|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128208": {
- "content": "<|reserved_special_token_200|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128209": {
- "content": "<|reserved_special_token_201|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128210": {
- "content": "<|reserved_special_token_202|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128211": {
- "content": "<|reserved_special_token_203|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128212": {
- "content": "<|reserved_special_token_204|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128213": {
- "content": "<|reserved_special_token_205|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128214": {
- "content": "<|reserved_special_token_206|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128215": {
- "content": "<|reserved_special_token_207|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128216": {
- "content": "<|reserved_special_token_208|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128217": {
- "content": "<|reserved_special_token_209|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128218": {
- "content": "<|reserved_special_token_210|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128219": {
- "content": "<|reserved_special_token_211|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128220": {
- "content": "<|reserved_special_token_212|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128221": {
- "content": "<|reserved_special_token_213|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128222": {
- "content": "<|reserved_special_token_214|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128223": {
- "content": "<|reserved_special_token_215|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128224": {
- "content": "<|reserved_special_token_216|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128225": {
- "content": "<|reserved_special_token_217|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128226": {
- "content": "<|reserved_special_token_218|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128227": {
- "content": "<|reserved_special_token_219|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128228": {
- "content": "<|reserved_special_token_220|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128229": {
- "content": "<|reserved_special_token_221|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128230": {
- "content": "<|reserved_special_token_222|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128231": {
- "content": "<|reserved_special_token_223|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128232": {
- "content": "<|reserved_special_token_224|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128233": {
- "content": "<|reserved_special_token_225|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128234": {
- "content": "<|reserved_special_token_226|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128235": {
- "content": "<|reserved_special_token_227|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128236": {
- "content": "<|reserved_special_token_228|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128237": {
- "content": "<|reserved_special_token_229|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128238": {
- "content": "<|reserved_special_token_230|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128239": {
- "content": "<|reserved_special_token_231|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128240": {
- "content": "<|reserved_special_token_232|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128241": {
- "content": "<|reserved_special_token_233|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128242": {
- "content": "<|reserved_special_token_234|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128243": {
- "content": "<|reserved_special_token_235|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128244": {
- "content": "<|reserved_special_token_236|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128245": {
- "content": "<|reserved_special_token_237|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128246": {
- "content": "<|reserved_special_token_238|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128247": {
- "content": "<|reserved_special_token_239|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128248": {
- "content": "<|reserved_special_token_240|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128249": {
- "content": "<|reserved_special_token_241|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128250": {
- "content": "<|reserved_special_token_242|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128251": {
- "content": "<|reserved_special_token_243|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128252": {
- "content": "<|reserved_special_token_244|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128253": {
- "content": "<|reserved_special_token_245|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128254": {
- "content": "<|reserved_special_token_246|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128255": {
- "content": "<|reserved_special_token_247|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- }
- },
- "bos_token": "<|begin_of_text|>",
- "clean_up_tokenization_spaces": true,
- "eos_token": "<|eot_id|>",
- "extra_special_tokens": {},
- "model_input_names": [
- "input_ids",
- "attention_mask"
- ],
- "model_max_length": 131072,
- "pad_token": "<|eot_id|>",
- "tokenizer_class": "PreTrainedTokenizerFast"
-}
diff --git a/checkpoint-200/trainer_state.json b/checkpoint-200/trainer_state.json
deleted file mode 100644
index f3e9d0600dc1755fa0c2b644f7857612aedbc180..0000000000000000000000000000000000000000
--- a/checkpoint-200/trainer_state.json
+++ /dev/null
@@ -1,206 +0,0 @@
-{
- "best_global_step": 50,
- "best_metric": 0.7558398842811584,
- "best_model_checkpoint": null,
- "epoch": 20.0,
- "eval_steps": 50,
- "global_step": 200,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 1.0,
- "grad_norm": 1.4660576581954956,
- "learning_rate": 3.6e-05,
- "loss": 1.152,
- "step": 10
- },
- {
- "epoch": 2.0,
- "grad_norm": 0.8749533295631409,
- "learning_rate": 7.6e-05,
- "loss": 1.0421,
- "step": 20
- },
- {
- "epoch": 3.0,
- "grad_norm": 3.37060284614563,
- "learning_rate": 0.000116,
- "loss": 0.8539,
- "step": 30
- },
- {
- "epoch": 4.0,
- "grad_norm": 1.5355278253555298,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.5483,
- "step": 40
- },
- {
- "epoch": 5.0,
- "grad_norm": 2.454838514328003,
- "learning_rate": 0.000196,
- "loss": 0.3736,
- "step": 50
- },
- {
- "epoch": 5.0,
- "eval_loss": 0.7558398842811584,
- "eval_runtime": 1.7227,
- "eval_samples_per_second": 2.902,
- "eval_steps_per_second": 2.902,
- "step": 50
- },
- {
- "epoch": 6.0,
- "grad_norm": 3.676417827606201,
- "learning_rate": 0.000196,
- "loss": 0.2291,
- "step": 60
- },
- {
- "epoch": 7.0,
- "grad_norm": 2.192375898361206,
- "learning_rate": 0.00019155555555555554,
- "loss": 0.1244,
- "step": 70
- },
- {
- "epoch": 8.0,
- "grad_norm": 2.630005359649658,
- "learning_rate": 0.00018711111111111112,
- "loss": 0.0862,
- "step": 80
- },
- {
- "epoch": 9.0,
- "grad_norm": 0.5021786093711853,
- "learning_rate": 0.00018266666666666667,
- "loss": 0.0614,
- "step": 90
- },
- {
- "epoch": 10.0,
- "grad_norm": 0.38170942664146423,
- "learning_rate": 0.00017822222222222222,
- "loss": 0.0471,
- "step": 100
- },
- {
- "epoch": 10.0,
- "eval_loss": 0.8806974291801453,
- "eval_runtime": 1.7764,
- "eval_samples_per_second": 2.815,
- "eval_steps_per_second": 2.815,
- "step": 100
- },
- {
- "epoch": 11.0,
- "grad_norm": 1.223647952079773,
- "learning_rate": 0.0001737777777777778,
- "loss": 0.0359,
- "step": 110
- },
- {
- "epoch": 12.0,
- "grad_norm": 0.5452818870544434,
- "learning_rate": 0.00016933333333333335,
- "loss": 0.0289,
- "step": 120
- },
- {
- "epoch": 13.0,
- "grad_norm": 0.19034886360168457,
- "learning_rate": 0.0001648888888888889,
- "loss": 0.029,
- "step": 130
- },
- {
- "epoch": 14.0,
- "grad_norm": 0.7483140230178833,
- "learning_rate": 0.00016044444444444445,
- "loss": 0.0247,
- "step": 140
- },
- {
- "epoch": 15.0,
- "grad_norm": 0.34800082445144653,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.0193,
- "step": 150
- },
- {
- "epoch": 15.0,
- "eval_loss": 0.9916993379592896,
- "eval_runtime": 1.7667,
- "eval_samples_per_second": 2.83,
- "eval_steps_per_second": 2.83,
- "step": 150
- },
- {
- "epoch": 16.0,
- "grad_norm": 0.24237586557865143,
- "learning_rate": 0.00015155555555555557,
- "loss": 0.0176,
- "step": 160
- },
- {
- "epoch": 17.0,
- "grad_norm": 0.13607177138328552,
- "learning_rate": 0.00014711111111111112,
- "loss": 0.0131,
- "step": 170
- },
- {
- "epoch": 18.0,
- "grad_norm": 0.3655266761779785,
- "learning_rate": 0.00014266666666666667,
- "loss": 0.0164,
- "step": 180
- },
- {
- "epoch": 19.0,
- "grad_norm": 0.08258651196956635,
- "learning_rate": 0.00013822222222222222,
- "loss": 0.013,
- "step": 190
- },
- {
- "epoch": 20.0,
- "grad_norm": 0.1830163151025772,
- "learning_rate": 0.00013377777777777777,
- "loss": 0.0126,
- "step": 200
- },
- {
- "epoch": 20.0,
- "eval_loss": 1.0726474523544312,
- "eval_runtime": 1.7657,
- "eval_samples_per_second": 2.832,
- "eval_steps_per_second": 2.832,
- "step": 200
- }
- ],
- "logging_steps": 10,
- "max_steps": 500,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 50,
- "save_steps": 100,
- "stateful_callbacks": {
- "TrainerControl": {
- "args": {
- "should_epoch_stop": false,
- "should_evaluate": false,
- "should_log": false,
- "should_save": true,
- "should_training_stop": false
- },
- "attributes": {}
- }
- },
- "total_flos": 2.655100782772224e+16,
- "train_batch_size": 1,
- "trial_name": null,
- "trial_params": null
-}
diff --git a/checkpoint-200/training_args.bin b/checkpoint-200/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/checkpoint-200/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777
diff --git a/checkpoint-300/README.md b/checkpoint-300/README.md
deleted file mode 100644
index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000
--- a/checkpoint-300/README.md
+++ /dev/null
@@ -1,207 +0,0 @@
----
-base_model: meta-llama/Llama-3.2-3B-Instruct
-library_name: peft
-pipeline_tag: text-generation
-tags:
-- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct
-- lora
-- transformers
----
-
-# Model Card for Model ID
-
-
-
-
-
-## Model Details
-
-### Model Description
-
-
-
-
-
-- **Developed by:** [More Information Needed]
-- **Funded by [optional]:** [More Information Needed]
-- **Shared by [optional]:** [More Information Needed]
-- **Model type:** [More Information Needed]
-- **Language(s) (NLP):** [More Information Needed]
-- **License:** [More Information Needed]
-- **Finetuned from model [optional]:** [More Information Needed]
-
-### Model Sources [optional]
-
-
-
-- **Repository:** [More Information Needed]
-- **Paper [optional]:** [More Information Needed]
-- **Demo [optional]:** [More Information Needed]
-
-## Uses
-
-
-
-### Direct Use
-
-
-
-[More Information Needed]
-
-### Downstream Use [optional]
-
-
-
-[More Information Needed]
-
-### Out-of-Scope Use
-
-
-
-[More Information Needed]
-
-## Bias, Risks, and Limitations
-
-
-
-[More Information Needed]
-
-### Recommendations
-
-
-
-Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
-
-## How to Get Started with the Model
-
-Use the code below to get started with the model.
-
-[More Information Needed]
-
-## Training Details
-
-### Training Data
-
-
-
-[More Information Needed]
-
-### Training Procedure
-
-
-
-#### Preprocessing [optional]
-
-[More Information Needed]
-
-
-#### Training Hyperparameters
-
-- **Training regime:** [More Information Needed]
-
-#### Speeds, Sizes, Times [optional]
-
-
-
-[More Information Needed]
-
-## Evaluation
-
-
-
-### Testing Data, Factors & Metrics
-
-#### Testing Data
-
-
-
-[More Information Needed]
-
-#### Factors
-
-
-
-[More Information Needed]
-
-#### Metrics
-
-
-
-[More Information Needed]
-
-### Results
-
-[More Information Needed]
-
-#### Summary
-
-
-
-## Model Examination [optional]
-
-
-
-[More Information Needed]
-
-## Environmental Impact
-
-
-
-Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
-
-- **Hardware Type:** [More Information Needed]
-- **Hours used:** [More Information Needed]
-- **Cloud Provider:** [More Information Needed]
-- **Compute Region:** [More Information Needed]
-- **Carbon Emitted:** [More Information Needed]
-
-## Technical Specifications [optional]
-
-### Model Architecture and Objective
-
-[More Information Needed]
-
-### Compute Infrastructure
-
-[More Information Needed]
-
-#### Hardware
-
-[More Information Needed]
-
-#### Software
-
-[More Information Needed]
-
-## Citation [optional]
-
-
-
-**BibTeX:**
-
-[More Information Needed]
-
-**APA:**
-
-[More Information Needed]
-
-## Glossary [optional]
-
-
-
-[More Information Needed]
-
-## More Information [optional]
-
-[More Information Needed]
-
-## Model Card Authors [optional]
-
-[More Information Needed]
-
-## Model Card Contact
-
-[More Information Needed]
-### Framework versions
-
-- PEFT 0.17.1
\ No newline at end of file
diff --git a/checkpoint-300/adapter_config.json b/checkpoint-300/adapter_config.json
deleted file mode 100644
index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000
--- a/checkpoint-300/adapter_config.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
- "alpha_pattern": {},
- "auto_mapping": null,
- "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct",
- "bias": "none",
- "corda_config": null,
- "eva_config": null,
- "exclude_modules": null,
- "fan_in_fan_out": false,
- "inference_mode": true,
- "init_lora_weights": true,
- "layer_replication": null,
- "layers_pattern": null,
- "layers_to_transform": null,
- "loftq_config": {},
- "lora_alpha": 32,
- "lora_bias": false,
- "lora_dropout": 0.1,
- "megatron_config": null,
- "megatron_core": "megatron.core",
- "modules_to_save": null,
- "peft_type": "LORA",
- "qalora_group_size": 16,
- "r": 16,
- "rank_pattern": {},
- "revision": null,
- "target_modules": [
- "down_proj",
- "v_proj",
- "q_proj",
- "k_proj",
- "gate_proj",
- "o_proj",
- "up_proj"
- ],
- "target_parameters": null,
- "task_type": "CAUSAL_LM",
- "trainable_token_indices": null,
- "use_dora": false,
- "use_qalora": false,
- "use_rslora": false
-}
\ No newline at end of file
diff --git a/checkpoint-300/adapter_model.safetensors b/checkpoint-300/adapter_model.safetensors
deleted file mode 100644
index fa02e67ef636431f3f1bd7bb50a45abc4d431e75..0000000000000000000000000000000000000000
--- a/checkpoint-300/adapter_model.safetensors
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:14af55caa175ef52c41fa5f381b7e459ab1e20ca247f29b76a1731a7dbd687a1
-size 97307544
diff --git a/checkpoint-300/chat_template.jinja b/checkpoint-300/chat_template.jinja
deleted file mode 100644
index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000
--- a/checkpoint-300/chat_template.jinja
+++ /dev/null
@@ -1,93 +0,0 @@
-{{- bos_token }}
-{%- if custom_tools is defined %}
- {%- set tools = custom_tools %}
-{%- endif %}
-{%- if not tools_in_user_message is defined %}
- {%- set tools_in_user_message = true %}
-{%- endif %}
-{%- if not date_string is defined %}
- {%- if strftime_now is defined %}
- {%- set date_string = strftime_now("%d %b %Y") %}
- {%- else %}
- {%- set date_string = "26 Jul 2024" %}
- {%- endif %}
-{%- endif %}
-{%- if not tools is defined %}
- {%- set tools = none %}
-{%- endif %}
-
-{#- This block extracts the system message, so we can slot it into the right place. #}
-{%- if messages[0]['role'] == 'system' %}
- {%- set system_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
-{%- else %}
- {%- set system_message = "" %}
-{%- endif %}
-
-{#- System message #}
-{{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
-{%- if tools is not none %}
- {{- "Environment: ipython\n" }}
-{%- endif %}
-{{- "Cutting Knowledge Date: December 2023\n" }}
-{{- "Today Date: " + date_string + "\n\n" }}
-{%- if tools is not none and not tools_in_user_message %}
- {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
-{%- endif %}
-{{- system_message }}
-{{- "<|eot_id|>" }}
-
-{#- Custom tools are passed in a user message with some extra guidance #}
-{%- if tools_in_user_message and not tools is none %}
- {#- Extract the first user message so we can plug it in here #}
- {%- if messages | length != 0 %}
- {%- set first_user_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
- {%- else %}
- {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
-{%- endif %}
- {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
- {{- "Given the following functions, please respond with a JSON for a function call " }}
- {{- "with its proper arguments that best answers the given prompt.\n\n" }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
- {{- first_user_message + "<|eot_id|>"}}
-{%- endif %}
-
-{%- for message in messages %}
- {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
- {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
- {%- elif 'tool_calls' in message %}
- {%- if not message.tool_calls|length == 1 %}
- {{- raise_exception("This model only supports single tool-calls at once!") }}
- {%- endif %}
- {%- set tool_call = message.tool_calls[0].function %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
- {{- '{"name": "' + tool_call.name + '", ' }}
- {{- '"parameters": ' }}
- {{- tool_call.arguments | tojson }}
- {{- "}" }}
- {{- "<|eot_id|>" }}
- {%- elif message.role == "tool" or message.role == "ipython" %}
- {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
- {%- if message.content is mapping or message.content is iterable %}
- {{- message.content | tojson }}
- {%- else %}
- {{- message.content }}
- {%- endif %}
- {{- "<|eot_id|>" }}
- {%- endif %}
-{%- endfor %}
-{%- if add_generation_prompt %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
-{%- endif %}
diff --git a/checkpoint-300/optimizer.pt b/checkpoint-300/optimizer.pt
deleted file mode 100644
index fbe8a79cd43aa475b2625c579adcaf7b916880ea..0000000000000000000000000000000000000000
--- a/checkpoint-300/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:11a8648049805bd21b4256f97311f1c7e5d02c1a70b65f964c5bf4c6bbea76db
-size 194846331
diff --git a/checkpoint-300/rng_state.pth b/checkpoint-300/rng_state.pth
deleted file mode 100644
index f9d54aec27333781cf245af3b0d9f6021b912fd0..0000000000000000000000000000000000000000
--- a/checkpoint-300/rng_state.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fbeebc7cba55f82e50391dff743835517526f978147ac553bab00af14778c49f
-size 14645
diff --git a/checkpoint-300/scaler.pt b/checkpoint-300/scaler.pt
deleted file mode 100644
index 872dde653491aa0ae40076c2acf51d2ae74df8ca..0000000000000000000000000000000000000000
--- a/checkpoint-300/scaler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:30af866df24edce708e1eb20700878b402fa05707fa9bc5f332496baf440dbbb
-size 1383
diff --git a/checkpoint-300/scheduler.pt b/checkpoint-300/scheduler.pt
deleted file mode 100644
index f1c1f6fce8c95692de3ea5fa744ec3bb94beda20..0000000000000000000000000000000000000000
--- a/checkpoint-300/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:ad080a2632c9b5ed3878ced74ddb263235bce94c1d8e5dcafc6c1256600d3693
-size 1465
diff --git a/checkpoint-300/special_tokens_map.json b/checkpoint-300/special_tokens_map.json
deleted file mode 100644
index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000
--- a/checkpoint-300/special_tokens_map.json
+++ /dev/null
@@ -1,17 +0,0 @@
-{
- "bos_token": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "eos_token": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": "<|eot_id|>"
-}
diff --git a/checkpoint-300/tokenizer.json b/checkpoint-300/tokenizer.json
deleted file mode 100644
index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000
--- a/checkpoint-300/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09
-size 17210184
diff --git a/checkpoint-300/tokenizer_config.json b/checkpoint-300/tokenizer_config.json
deleted file mode 100644
index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000
--- a/checkpoint-300/tokenizer_config.json
+++ /dev/null
@@ -1,2063 +0,0 @@
-{
- "added_tokens_decoder": {
- "128000": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128001": {
- "content": "<|end_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128002": {
- "content": "<|reserved_special_token_0|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128003": {
- "content": "<|reserved_special_token_1|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128004": {
- "content": "<|finetune_right_pad_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128005": {
- "content": "<|reserved_special_token_2|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128006": {
- "content": "<|start_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128007": {
- "content": "<|end_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128008": {
- "content": "<|eom_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128009": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128010": {
- "content": "<|python_tag|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128011": {
- "content": "<|reserved_special_token_3|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128012": {
- "content": "<|reserved_special_token_4|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128013": {
- "content": "<|reserved_special_token_5|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128014": {
- "content": "<|reserved_special_token_6|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128015": {
- "content": "<|reserved_special_token_7|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128016": {
- "content": "<|reserved_special_token_8|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128017": {
- "content": "<|reserved_special_token_9|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128018": {
- "content": "<|reserved_special_token_10|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128019": {
- "content": "<|reserved_special_token_11|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128020": {
- "content": "<|reserved_special_token_12|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128021": {
- "content": "<|reserved_special_token_13|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128022": {
- "content": "<|reserved_special_token_14|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128023": {
- "content": "<|reserved_special_token_15|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128024": {
- "content": "<|reserved_special_token_16|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128025": {
- "content": "<|reserved_special_token_17|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128026": {
- "content": "<|reserved_special_token_18|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128027": {
- "content": "<|reserved_special_token_19|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128028": {
- "content": "<|reserved_special_token_20|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128029": {
- "content": "<|reserved_special_token_21|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128030": {
- "content": "<|reserved_special_token_22|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128031": {
- "content": "<|reserved_special_token_23|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128032": {
- "content": "<|reserved_special_token_24|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128033": {
- "content": "<|reserved_special_token_25|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128034": {
- "content": "<|reserved_special_token_26|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128035": {
- "content": "<|reserved_special_token_27|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128036": {
- "content": "<|reserved_special_token_28|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128037": {
- "content": "<|reserved_special_token_29|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128038": {
- "content": "<|reserved_special_token_30|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128039": {
- "content": "<|reserved_special_token_31|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128040": {
- "content": "<|reserved_special_token_32|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128041": {
- "content": "<|reserved_special_token_33|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128042": {
- "content": "<|reserved_special_token_34|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128043": {
- "content": "<|reserved_special_token_35|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128044": {
- "content": "<|reserved_special_token_36|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128045": {
- "content": "<|reserved_special_token_37|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128046": {
- "content": "<|reserved_special_token_38|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128047": {
- "content": "<|reserved_special_token_39|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128048": {
- "content": "<|reserved_special_token_40|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128049": {
- "content": "<|reserved_special_token_41|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128050": {
- "content": "<|reserved_special_token_42|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128051": {
- "content": "<|reserved_special_token_43|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128052": {
- "content": "<|reserved_special_token_44|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128053": {
- "content": "<|reserved_special_token_45|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128054": {
- "content": "<|reserved_special_token_46|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128055": {
- "content": "<|reserved_special_token_47|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128056": {
- "content": "<|reserved_special_token_48|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128057": {
- "content": "<|reserved_special_token_49|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128058": {
- "content": "<|reserved_special_token_50|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128059": {
- "content": "<|reserved_special_token_51|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128060": {
- "content": "<|reserved_special_token_52|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128061": {
- "content": "<|reserved_special_token_53|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128062": {
- "content": "<|reserved_special_token_54|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128063": {
- "content": "<|reserved_special_token_55|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128064": {
- "content": "<|reserved_special_token_56|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128065": {
- "content": "<|reserved_special_token_57|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128066": {
- "content": "<|reserved_special_token_58|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128067": {
- "content": "<|reserved_special_token_59|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128068": {
- "content": "<|reserved_special_token_60|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128069": {
- "content": "<|reserved_special_token_61|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128070": {
- "content": "<|reserved_special_token_62|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128071": {
- "content": "<|reserved_special_token_63|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128072": {
- "content": "<|reserved_special_token_64|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128073": {
- "content": "<|reserved_special_token_65|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128074": {
- "content": "<|reserved_special_token_66|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128075": {
- "content": "<|reserved_special_token_67|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128076": {
- "content": "<|reserved_special_token_68|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128077": {
- "content": "<|reserved_special_token_69|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128078": {
- "content": "<|reserved_special_token_70|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128079": {
- "content": "<|reserved_special_token_71|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128080": {
- "content": "<|reserved_special_token_72|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128081": {
- "content": "<|reserved_special_token_73|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128082": {
- "content": "<|reserved_special_token_74|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128083": {
- "content": "<|reserved_special_token_75|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128084": {
- "content": "<|reserved_special_token_76|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128085": {
- "content": "<|reserved_special_token_77|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128086": {
- "content": "<|reserved_special_token_78|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128087": {
- "content": "<|reserved_special_token_79|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128088": {
- "content": "<|reserved_special_token_80|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128089": {
- "content": "<|reserved_special_token_81|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128090": {
- "content": "<|reserved_special_token_82|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128091": {
- "content": "<|reserved_special_token_83|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128092": {
- "content": "<|reserved_special_token_84|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128093": {
- "content": "<|reserved_special_token_85|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128094": {
- "content": "<|reserved_special_token_86|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128095": {
- "content": "<|reserved_special_token_87|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128096": {
- "content": "<|reserved_special_token_88|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128097": {
- "content": "<|reserved_special_token_89|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128098": {
- "content": "<|reserved_special_token_90|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128099": {
- "content": "<|reserved_special_token_91|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128100": {
- "content": "<|reserved_special_token_92|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128101": {
- "content": "<|reserved_special_token_93|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128102": {
- "content": "<|reserved_special_token_94|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128103": {
- "content": "<|reserved_special_token_95|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128104": {
- "content": "<|reserved_special_token_96|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128105": {
- "content": "<|reserved_special_token_97|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128106": {
- "content": "<|reserved_special_token_98|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128107": {
- "content": "<|reserved_special_token_99|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128108": {
- "content": "<|reserved_special_token_100|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128109": {
- "content": "<|reserved_special_token_101|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128110": {
- "content": "<|reserved_special_token_102|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128111": {
- "content": "<|reserved_special_token_103|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128112": {
- "content": "<|reserved_special_token_104|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128113": {
- "content": "<|reserved_special_token_105|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128114": {
- "content": "<|reserved_special_token_106|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128115": {
- "content": "<|reserved_special_token_107|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128116": {
- "content": "<|reserved_special_token_108|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128117": {
- "content": "<|reserved_special_token_109|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128118": {
- "content": "<|reserved_special_token_110|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128119": {
- "content": "<|reserved_special_token_111|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128120": {
- "content": "<|reserved_special_token_112|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128121": {
- "content": "<|reserved_special_token_113|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128122": {
- "content": "<|reserved_special_token_114|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128123": {
- "content": "<|reserved_special_token_115|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128124": {
- "content": "<|reserved_special_token_116|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128125": {
- "content": "<|reserved_special_token_117|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128126": {
- "content": "<|reserved_special_token_118|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128127": {
- "content": "<|reserved_special_token_119|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128128": {
- "content": "<|reserved_special_token_120|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128129": {
- "content": "<|reserved_special_token_121|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128130": {
- "content": "<|reserved_special_token_122|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128131": {
- "content": "<|reserved_special_token_123|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128132": {
- "content": "<|reserved_special_token_124|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128133": {
- "content": "<|reserved_special_token_125|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128134": {
- "content": "<|reserved_special_token_126|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128135": {
- "content": "<|reserved_special_token_127|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128136": {
- "content": "<|reserved_special_token_128|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128137": {
- "content": "<|reserved_special_token_129|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128138": {
- "content": "<|reserved_special_token_130|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128139": {
- "content": "<|reserved_special_token_131|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128140": {
- "content": "<|reserved_special_token_132|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128141": {
- "content": "<|reserved_special_token_133|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128142": {
- "content": "<|reserved_special_token_134|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128143": {
- "content": "<|reserved_special_token_135|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128144": {
- "content": "<|reserved_special_token_136|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128145": {
- "content": "<|reserved_special_token_137|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128146": {
- "content": "<|reserved_special_token_138|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128147": {
- "content": "<|reserved_special_token_139|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128148": {
- "content": "<|reserved_special_token_140|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128149": {
- "content": "<|reserved_special_token_141|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128150": {
- "content": "<|reserved_special_token_142|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128151": {
- "content": "<|reserved_special_token_143|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128152": {
- "content": "<|reserved_special_token_144|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128153": {
- "content": "<|reserved_special_token_145|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128154": {
- "content": "<|reserved_special_token_146|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128155": {
- "content": "<|reserved_special_token_147|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128156": {
- "content": "<|reserved_special_token_148|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128157": {
- "content": "<|reserved_special_token_149|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128158": {
- "content": "<|reserved_special_token_150|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128159": {
- "content": "<|reserved_special_token_151|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128160": {
- "content": "<|reserved_special_token_152|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128161": {
- "content": "<|reserved_special_token_153|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128162": {
- "content": "<|reserved_special_token_154|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128163": {
- "content": "<|reserved_special_token_155|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128164": {
- "content": "<|reserved_special_token_156|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128165": {
- "content": "<|reserved_special_token_157|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128166": {
- "content": "<|reserved_special_token_158|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128167": {
- "content": "<|reserved_special_token_159|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128168": {
- "content": "<|reserved_special_token_160|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128169": {
- "content": "<|reserved_special_token_161|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128170": {
- "content": "<|reserved_special_token_162|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128171": {
- "content": "<|reserved_special_token_163|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128172": {
- "content": "<|reserved_special_token_164|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128173": {
- "content": "<|reserved_special_token_165|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128174": {
- "content": "<|reserved_special_token_166|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128175": {
- "content": "<|reserved_special_token_167|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128176": {
- "content": "<|reserved_special_token_168|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128177": {
- "content": "<|reserved_special_token_169|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128178": {
- "content": "<|reserved_special_token_170|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128179": {
- "content": "<|reserved_special_token_171|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128180": {
- "content": "<|reserved_special_token_172|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128181": {
- "content": "<|reserved_special_token_173|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128182": {
- "content": "<|reserved_special_token_174|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128183": {
- "content": "<|reserved_special_token_175|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128184": {
- "content": "<|reserved_special_token_176|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128185": {
- "content": "<|reserved_special_token_177|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128186": {
- "content": "<|reserved_special_token_178|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128187": {
- "content": "<|reserved_special_token_179|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128188": {
- "content": "<|reserved_special_token_180|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128189": {
- "content": "<|reserved_special_token_181|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128190": {
- "content": "<|reserved_special_token_182|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128191": {
- "content": "<|reserved_special_token_183|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128192": {
- "content": "<|reserved_special_token_184|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128193": {
- "content": "<|reserved_special_token_185|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128194": {
- "content": "<|reserved_special_token_186|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128195": {
- "content": "<|reserved_special_token_187|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128196": {
- "content": "<|reserved_special_token_188|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128197": {
- "content": "<|reserved_special_token_189|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128198": {
- "content": "<|reserved_special_token_190|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128199": {
- "content": "<|reserved_special_token_191|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128200": {
- "content": "<|reserved_special_token_192|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128201": {
- "content": "<|reserved_special_token_193|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128202": {
- "content": "<|reserved_special_token_194|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128203": {
- "content": "<|reserved_special_token_195|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128204": {
- "content": "<|reserved_special_token_196|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128205": {
- "content": "<|reserved_special_token_197|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128206": {
- "content": "<|reserved_special_token_198|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128207": {
- "content": "<|reserved_special_token_199|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128208": {
- "content": "<|reserved_special_token_200|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128209": {
- "content": "<|reserved_special_token_201|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128210": {
- "content": "<|reserved_special_token_202|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128211": {
- "content": "<|reserved_special_token_203|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128212": {
- "content": "<|reserved_special_token_204|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128213": {
- "content": "<|reserved_special_token_205|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128214": {
- "content": "<|reserved_special_token_206|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128215": {
- "content": "<|reserved_special_token_207|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128216": {
- "content": "<|reserved_special_token_208|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128217": {
- "content": "<|reserved_special_token_209|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128218": {
- "content": "<|reserved_special_token_210|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128219": {
- "content": "<|reserved_special_token_211|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128220": {
- "content": "<|reserved_special_token_212|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128221": {
- "content": "<|reserved_special_token_213|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128222": {
- "content": "<|reserved_special_token_214|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128223": {
- "content": "<|reserved_special_token_215|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128224": {
- "content": "<|reserved_special_token_216|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128225": {
- "content": "<|reserved_special_token_217|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128226": {
- "content": "<|reserved_special_token_218|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128227": {
- "content": "<|reserved_special_token_219|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128228": {
- "content": "<|reserved_special_token_220|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128229": {
- "content": "<|reserved_special_token_221|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128230": {
- "content": "<|reserved_special_token_222|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128231": {
- "content": "<|reserved_special_token_223|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128232": {
- "content": "<|reserved_special_token_224|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128233": {
- "content": "<|reserved_special_token_225|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128234": {
- "content": "<|reserved_special_token_226|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128235": {
- "content": "<|reserved_special_token_227|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128236": {
- "content": "<|reserved_special_token_228|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128237": {
- "content": "<|reserved_special_token_229|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128238": {
- "content": "<|reserved_special_token_230|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128239": {
- "content": "<|reserved_special_token_231|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128240": {
- "content": "<|reserved_special_token_232|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128241": {
- "content": "<|reserved_special_token_233|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128242": {
- "content": "<|reserved_special_token_234|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128243": {
- "content": "<|reserved_special_token_235|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128244": {
- "content": "<|reserved_special_token_236|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128245": {
- "content": "<|reserved_special_token_237|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128246": {
- "content": "<|reserved_special_token_238|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128247": {
- "content": "<|reserved_special_token_239|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128248": {
- "content": "<|reserved_special_token_240|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128249": {
- "content": "<|reserved_special_token_241|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128250": {
- "content": "<|reserved_special_token_242|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128251": {
- "content": "<|reserved_special_token_243|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128252": {
- "content": "<|reserved_special_token_244|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128253": {
- "content": "<|reserved_special_token_245|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128254": {
- "content": "<|reserved_special_token_246|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128255": {
- "content": "<|reserved_special_token_247|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- }
- },
- "bos_token": "<|begin_of_text|>",
- "clean_up_tokenization_spaces": true,
- "eos_token": "<|eot_id|>",
- "extra_special_tokens": {},
- "model_input_names": [
- "input_ids",
- "attention_mask"
- ],
- "model_max_length": 131072,
- "pad_token": "<|eot_id|>",
- "tokenizer_class": "PreTrainedTokenizerFast"
-}
diff --git a/checkpoint-300/trainer_state.json b/checkpoint-300/trainer_state.json
deleted file mode 100644
index 19c01d505ad92122929d029d241bfd9151c6e278..0000000000000000000000000000000000000000
--- a/checkpoint-300/trainer_state.json
+++ /dev/null
@@ -1,292 +0,0 @@
-{
- "best_global_step": 50,
- "best_metric": 0.7558398842811584,
- "best_model_checkpoint": null,
- "epoch": 30.0,
- "eval_steps": 50,
- "global_step": 300,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 1.0,
- "grad_norm": 1.4660576581954956,
- "learning_rate": 3.6e-05,
- "loss": 1.152,
- "step": 10
- },
- {
- "epoch": 2.0,
- "grad_norm": 0.8749533295631409,
- "learning_rate": 7.6e-05,
- "loss": 1.0421,
- "step": 20
- },
- {
- "epoch": 3.0,
- "grad_norm": 3.37060284614563,
- "learning_rate": 0.000116,
- "loss": 0.8539,
- "step": 30
- },
- {
- "epoch": 4.0,
- "grad_norm": 1.5355278253555298,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.5483,
- "step": 40
- },
- {
- "epoch": 5.0,
- "grad_norm": 2.454838514328003,
- "learning_rate": 0.000196,
- "loss": 0.3736,
- "step": 50
- },
- {
- "epoch": 5.0,
- "eval_loss": 0.7558398842811584,
- "eval_runtime": 1.7227,
- "eval_samples_per_second": 2.902,
- "eval_steps_per_second": 2.902,
- "step": 50
- },
- {
- "epoch": 6.0,
- "grad_norm": 3.676417827606201,
- "learning_rate": 0.000196,
- "loss": 0.2291,
- "step": 60
- },
- {
- "epoch": 7.0,
- "grad_norm": 2.192375898361206,
- "learning_rate": 0.00019155555555555554,
- "loss": 0.1244,
- "step": 70
- },
- {
- "epoch": 8.0,
- "grad_norm": 2.630005359649658,
- "learning_rate": 0.00018711111111111112,
- "loss": 0.0862,
- "step": 80
- },
- {
- "epoch": 9.0,
- "grad_norm": 0.5021786093711853,
- "learning_rate": 0.00018266666666666667,
- "loss": 0.0614,
- "step": 90
- },
- {
- "epoch": 10.0,
- "grad_norm": 0.38170942664146423,
- "learning_rate": 0.00017822222222222222,
- "loss": 0.0471,
- "step": 100
- },
- {
- "epoch": 10.0,
- "eval_loss": 0.8806974291801453,
- "eval_runtime": 1.7764,
- "eval_samples_per_second": 2.815,
- "eval_steps_per_second": 2.815,
- "step": 100
- },
- {
- "epoch": 11.0,
- "grad_norm": 1.223647952079773,
- "learning_rate": 0.0001737777777777778,
- "loss": 0.0359,
- "step": 110
- },
- {
- "epoch": 12.0,
- "grad_norm": 0.5452818870544434,
- "learning_rate": 0.00016933333333333335,
- "loss": 0.0289,
- "step": 120
- },
- {
- "epoch": 13.0,
- "grad_norm": 0.19034886360168457,
- "learning_rate": 0.0001648888888888889,
- "loss": 0.029,
- "step": 130
- },
- {
- "epoch": 14.0,
- "grad_norm": 0.7483140230178833,
- "learning_rate": 0.00016044444444444445,
- "loss": 0.0247,
- "step": 140
- },
- {
- "epoch": 15.0,
- "grad_norm": 0.34800082445144653,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.0193,
- "step": 150
- },
- {
- "epoch": 15.0,
- "eval_loss": 0.9916993379592896,
- "eval_runtime": 1.7667,
- "eval_samples_per_second": 2.83,
- "eval_steps_per_second": 2.83,
- "step": 150
- },
- {
- "epoch": 16.0,
- "grad_norm": 0.24237586557865143,
- "learning_rate": 0.00015155555555555557,
- "loss": 0.0176,
- "step": 160
- },
- {
- "epoch": 17.0,
- "grad_norm": 0.13607177138328552,
- "learning_rate": 0.00014711111111111112,
- "loss": 0.0131,
- "step": 170
- },
- {
- "epoch": 18.0,
- "grad_norm": 0.3655266761779785,
- "learning_rate": 0.00014266666666666667,
- "loss": 0.0164,
- "step": 180
- },
- {
- "epoch": 19.0,
- "grad_norm": 0.08258651196956635,
- "learning_rate": 0.00013822222222222222,
- "loss": 0.013,
- "step": 190
- },
- {
- "epoch": 20.0,
- "grad_norm": 0.1830163151025772,
- "learning_rate": 0.00013377777777777777,
- "loss": 0.0126,
- "step": 200
- },
- {
- "epoch": 20.0,
- "eval_loss": 1.0726474523544312,
- "eval_runtime": 1.7657,
- "eval_samples_per_second": 2.832,
- "eval_steps_per_second": 2.832,
- "step": 200
- },
- {
- "epoch": 21.0,
- "grad_norm": 0.12009257823228836,
- "learning_rate": 0.00012933333333333332,
- "loss": 0.0108,
- "step": 210
- },
- {
- "epoch": 22.0,
- "grad_norm": 0.1172371432185173,
- "learning_rate": 0.0001248888888888889,
- "loss": 0.0122,
- "step": 220
- },
- {
- "epoch": 23.0,
- "grad_norm": 0.14445751905441284,
- "learning_rate": 0.00012044444444444445,
- "loss": 0.0121,
- "step": 230
- },
- {
- "epoch": 24.0,
- "grad_norm": 0.18198293447494507,
- "learning_rate": 0.000116,
- "loss": 0.0128,
- "step": 240
- },
- {
- "epoch": 25.0,
- "grad_norm": 0.1562514454126358,
- "learning_rate": 0.00011155555555555556,
- "loss": 0.0117,
- "step": 250
- },
- {
- "epoch": 25.0,
- "eval_loss": 1.106227159500122,
- "eval_runtime": 1.7564,
- "eval_samples_per_second": 2.847,
- "eval_steps_per_second": 2.847,
- "step": 250
- },
- {
- "epoch": 26.0,
- "grad_norm": 0.06052432581782341,
- "learning_rate": 0.00010711111111111111,
- "loss": 0.0123,
- "step": 260
- },
- {
- "epoch": 27.0,
- "grad_norm": 0.03066837601363659,
- "learning_rate": 0.00010266666666666666,
- "loss": 0.0106,
- "step": 270
- },
- {
- "epoch": 28.0,
- "grad_norm": 0.034792304039001465,
- "learning_rate": 9.822222222222223e-05,
- "loss": 0.0124,
- "step": 280
- },
- {
- "epoch": 29.0,
- "grad_norm": 0.028368409723043442,
- "learning_rate": 9.377777777777779e-05,
- "loss": 0.0107,
- "step": 290
- },
- {
- "epoch": 30.0,
- "grad_norm": 0.03258921578526497,
- "learning_rate": 8.933333333333334e-05,
- "loss": 0.0109,
- "step": 300
- },
- {
- "epoch": 30.0,
- "eval_loss": 1.1306606531143188,
- "eval_runtime": 1.7675,
- "eval_samples_per_second": 2.829,
- "eval_steps_per_second": 2.829,
- "step": 300
- }
- ],
- "logging_steps": 10,
- "max_steps": 500,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 50,
- "save_steps": 100,
- "stateful_callbacks": {
- "TrainerControl": {
- "args": {
- "should_epoch_stop": false,
- "should_evaluate": false,
- "should_log": false,
- "should_save": true,
- "should_training_stop": false
- },
- "attributes": {}
- }
- },
- "total_flos": 3.982651174158336e+16,
- "train_batch_size": 1,
- "trial_name": null,
- "trial_params": null
-}
diff --git a/checkpoint-300/training_args.bin b/checkpoint-300/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/checkpoint-300/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777
diff --git a/checkpoint-400/README.md b/checkpoint-400/README.md
deleted file mode 100644
index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000
--- a/checkpoint-400/README.md
+++ /dev/null
@@ -1,207 +0,0 @@
----
-base_model: meta-llama/Llama-3.2-3B-Instruct
-library_name: peft
-pipeline_tag: text-generation
-tags:
-- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct
-- lora
-- transformers
----
-
-# Model Card for Model ID
-
-
-
-
-
-## Model Details
-
-### Model Description
-
-
-
-
-
-- **Developed by:** [More Information Needed]
-- **Funded by [optional]:** [More Information Needed]
-- **Shared by [optional]:** [More Information Needed]
-- **Model type:** [More Information Needed]
-- **Language(s) (NLP):** [More Information Needed]
-- **License:** [More Information Needed]
-- **Finetuned from model [optional]:** [More Information Needed]
-
-### Model Sources [optional]
-
-
-
-- **Repository:** [More Information Needed]
-- **Paper [optional]:** [More Information Needed]
-- **Demo [optional]:** [More Information Needed]
-
-## Uses
-
-
-
-### Direct Use
-
-
-
-[More Information Needed]
-
-### Downstream Use [optional]
-
-
-
-[More Information Needed]
-
-### Out-of-Scope Use
-
-
-
-[More Information Needed]
-
-## Bias, Risks, and Limitations
-
-
-
-[More Information Needed]
-
-### Recommendations
-
-
-
-Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
-
-## How to Get Started with the Model
-
-Use the code below to get started with the model.
-
-[More Information Needed]
-
-## Training Details
-
-### Training Data
-
-
-
-[More Information Needed]
-
-### Training Procedure
-
-
-
-#### Preprocessing [optional]
-
-[More Information Needed]
-
-
-#### Training Hyperparameters
-
-- **Training regime:** [More Information Needed]
-
-#### Speeds, Sizes, Times [optional]
-
-
-
-[More Information Needed]
-
-## Evaluation
-
-
-
-### Testing Data, Factors & Metrics
-
-#### Testing Data
-
-
-
-[More Information Needed]
-
-#### Factors
-
-
-
-[More Information Needed]
-
-#### Metrics
-
-
-
-[More Information Needed]
-
-### Results
-
-[More Information Needed]
-
-#### Summary
-
-
-
-## Model Examination [optional]
-
-
-
-[More Information Needed]
-
-## Environmental Impact
-
-
-
-Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
-
-- **Hardware Type:** [More Information Needed]
-- **Hours used:** [More Information Needed]
-- **Cloud Provider:** [More Information Needed]
-- **Compute Region:** [More Information Needed]
-- **Carbon Emitted:** [More Information Needed]
-
-## Technical Specifications [optional]
-
-### Model Architecture and Objective
-
-[More Information Needed]
-
-### Compute Infrastructure
-
-[More Information Needed]
-
-#### Hardware
-
-[More Information Needed]
-
-#### Software
-
-[More Information Needed]
-
-## Citation [optional]
-
-
-
-**BibTeX:**
-
-[More Information Needed]
-
-**APA:**
-
-[More Information Needed]
-
-## Glossary [optional]
-
-
-
-[More Information Needed]
-
-## More Information [optional]
-
-[More Information Needed]
-
-## Model Card Authors [optional]
-
-[More Information Needed]
-
-## Model Card Contact
-
-[More Information Needed]
-### Framework versions
-
-- PEFT 0.17.1
\ No newline at end of file
diff --git a/checkpoint-400/adapter_config.json b/checkpoint-400/adapter_config.json
deleted file mode 100644
index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000
--- a/checkpoint-400/adapter_config.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
- "alpha_pattern": {},
- "auto_mapping": null,
- "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct",
- "bias": "none",
- "corda_config": null,
- "eva_config": null,
- "exclude_modules": null,
- "fan_in_fan_out": false,
- "inference_mode": true,
- "init_lora_weights": true,
- "layer_replication": null,
- "layers_pattern": null,
- "layers_to_transform": null,
- "loftq_config": {},
- "lora_alpha": 32,
- "lora_bias": false,
- "lora_dropout": 0.1,
- "megatron_config": null,
- "megatron_core": "megatron.core",
- "modules_to_save": null,
- "peft_type": "LORA",
- "qalora_group_size": 16,
- "r": 16,
- "rank_pattern": {},
- "revision": null,
- "target_modules": [
- "down_proj",
- "v_proj",
- "q_proj",
- "k_proj",
- "gate_proj",
- "o_proj",
- "up_proj"
- ],
- "target_parameters": null,
- "task_type": "CAUSAL_LM",
- "trainable_token_indices": null,
- "use_dora": false,
- "use_qalora": false,
- "use_rslora": false
-}
\ No newline at end of file
diff --git a/checkpoint-400/adapter_model.safetensors b/checkpoint-400/adapter_model.safetensors
deleted file mode 100644
index 2bdf98938412f41cdad1d039985e9ca6e4ae8cfc..0000000000000000000000000000000000000000
--- a/checkpoint-400/adapter_model.safetensors
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:b09ec477371bdfadd7438ffd8a17ffa23db183558c378efb88851aa2f0878c67
-size 97307544
diff --git a/checkpoint-400/chat_template.jinja b/checkpoint-400/chat_template.jinja
deleted file mode 100644
index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000
--- a/checkpoint-400/chat_template.jinja
+++ /dev/null
@@ -1,93 +0,0 @@
-{{- bos_token }}
-{%- if custom_tools is defined %}
- {%- set tools = custom_tools %}
-{%- endif %}
-{%- if not tools_in_user_message is defined %}
- {%- set tools_in_user_message = true %}
-{%- endif %}
-{%- if not date_string is defined %}
- {%- if strftime_now is defined %}
- {%- set date_string = strftime_now("%d %b %Y") %}
- {%- else %}
- {%- set date_string = "26 Jul 2024" %}
- {%- endif %}
-{%- endif %}
-{%- if not tools is defined %}
- {%- set tools = none %}
-{%- endif %}
-
-{#- This block extracts the system message, so we can slot it into the right place. #}
-{%- if messages[0]['role'] == 'system' %}
- {%- set system_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
-{%- else %}
- {%- set system_message = "" %}
-{%- endif %}
-
-{#- System message #}
-{{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
-{%- if tools is not none %}
- {{- "Environment: ipython\n" }}
-{%- endif %}
-{{- "Cutting Knowledge Date: December 2023\n" }}
-{{- "Today Date: " + date_string + "\n\n" }}
-{%- if tools is not none and not tools_in_user_message %}
- {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
-{%- endif %}
-{{- system_message }}
-{{- "<|eot_id|>" }}
-
-{#- Custom tools are passed in a user message with some extra guidance #}
-{%- if tools_in_user_message and not tools is none %}
- {#- Extract the first user message so we can plug it in here #}
- {%- if messages | length != 0 %}
- {%- set first_user_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
- {%- else %}
- {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
-{%- endif %}
- {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
- {{- "Given the following functions, please respond with a JSON for a function call " }}
- {{- "with its proper arguments that best answers the given prompt.\n\n" }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
- {{- first_user_message + "<|eot_id|>"}}
-{%- endif %}
-
-{%- for message in messages %}
- {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
- {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
- {%- elif 'tool_calls' in message %}
- {%- if not message.tool_calls|length == 1 %}
- {{- raise_exception("This model only supports single tool-calls at once!") }}
- {%- endif %}
- {%- set tool_call = message.tool_calls[0].function %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
- {{- '{"name": "' + tool_call.name + '", ' }}
- {{- '"parameters": ' }}
- {{- tool_call.arguments | tojson }}
- {{- "}" }}
- {{- "<|eot_id|>" }}
- {%- elif message.role == "tool" or message.role == "ipython" %}
- {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
- {%- if message.content is mapping or message.content is iterable %}
- {{- message.content | tojson }}
- {%- else %}
- {{- message.content }}
- {%- endif %}
- {{- "<|eot_id|>" }}
- {%- endif %}
-{%- endfor %}
-{%- if add_generation_prompt %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
-{%- endif %}
diff --git a/checkpoint-400/optimizer.pt b/checkpoint-400/optimizer.pt
deleted file mode 100644
index 4ba2f96b88a00a983fe9e9439f4f034f5cc2a620..0000000000000000000000000000000000000000
--- a/checkpoint-400/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:1749edc7d7adb361c013e5d65cd9069566799ebea20c3ae8bb3e5eb9ea6d2514
-size 194846331
diff --git a/checkpoint-400/rng_state.pth b/checkpoint-400/rng_state.pth
deleted file mode 100644
index 2606109424f937f1bc52c93bea33a5d97a80968f..0000000000000000000000000000000000000000
--- a/checkpoint-400/rng_state.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:1d4b1ffec63a9c901fcbc38e47d8abd2121fc84af05caaa0e7adce9ba19650e1
-size 14645
diff --git a/checkpoint-400/scaler.pt b/checkpoint-400/scaler.pt
deleted file mode 100644
index 0b0bfee2584fa7aba2e3ab882380cdc54add60e0..0000000000000000000000000000000000000000
--- a/checkpoint-400/scaler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:30858f23bcb22d0baef45bd4add9d6fa474141308c12653c706077b87d932e49
-size 1383
diff --git a/checkpoint-400/scheduler.pt b/checkpoint-400/scheduler.pt
deleted file mode 100644
index b4e8cfd932581e913336ce2133d36088daa2c2a5..0000000000000000000000000000000000000000
--- a/checkpoint-400/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:aa8793d08d90abcd0fe6bf5d2eb9e6c925d0781705a129dc03f5ec30bc5e94ba
-size 1465
diff --git a/checkpoint-400/special_tokens_map.json b/checkpoint-400/special_tokens_map.json
deleted file mode 100644
index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000
--- a/checkpoint-400/special_tokens_map.json
+++ /dev/null
@@ -1,17 +0,0 @@
-{
- "bos_token": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "eos_token": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": "<|eot_id|>"
-}
diff --git a/checkpoint-400/tokenizer.json b/checkpoint-400/tokenizer.json
deleted file mode 100644
index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000
--- a/checkpoint-400/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09
-size 17210184
diff --git a/checkpoint-400/tokenizer_config.json b/checkpoint-400/tokenizer_config.json
deleted file mode 100644
index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000
--- a/checkpoint-400/tokenizer_config.json
+++ /dev/null
@@ -1,2063 +0,0 @@
-{
- "added_tokens_decoder": {
- "128000": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128001": {
- "content": "<|end_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128002": {
- "content": "<|reserved_special_token_0|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128003": {
- "content": "<|reserved_special_token_1|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128004": {
- "content": "<|finetune_right_pad_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128005": {
- "content": "<|reserved_special_token_2|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128006": {
- "content": "<|start_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128007": {
- "content": "<|end_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128008": {
- "content": "<|eom_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128009": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128010": {
- "content": "<|python_tag|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128011": {
- "content": "<|reserved_special_token_3|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128012": {
- "content": "<|reserved_special_token_4|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128013": {
- "content": "<|reserved_special_token_5|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128014": {
- "content": "<|reserved_special_token_6|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128015": {
- "content": "<|reserved_special_token_7|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128016": {
- "content": "<|reserved_special_token_8|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128017": {
- "content": "<|reserved_special_token_9|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128018": {
- "content": "<|reserved_special_token_10|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128019": {
- "content": "<|reserved_special_token_11|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128020": {
- "content": "<|reserved_special_token_12|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128021": {
- "content": "<|reserved_special_token_13|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128022": {
- "content": "<|reserved_special_token_14|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128023": {
- "content": "<|reserved_special_token_15|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128024": {
- "content": "<|reserved_special_token_16|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128025": {
- "content": "<|reserved_special_token_17|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128026": {
- "content": "<|reserved_special_token_18|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128027": {
- "content": "<|reserved_special_token_19|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128028": {
- "content": "<|reserved_special_token_20|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128029": {
- "content": "<|reserved_special_token_21|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128030": {
- "content": "<|reserved_special_token_22|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128031": {
- "content": "<|reserved_special_token_23|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128032": {
- "content": "<|reserved_special_token_24|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128033": {
- "content": "<|reserved_special_token_25|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128034": {
- "content": "<|reserved_special_token_26|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128035": {
- "content": "<|reserved_special_token_27|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128036": {
- "content": "<|reserved_special_token_28|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128037": {
- "content": "<|reserved_special_token_29|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128038": {
- "content": "<|reserved_special_token_30|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128039": {
- "content": "<|reserved_special_token_31|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128040": {
- "content": "<|reserved_special_token_32|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128041": {
- "content": "<|reserved_special_token_33|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128042": {
- "content": "<|reserved_special_token_34|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128043": {
- "content": "<|reserved_special_token_35|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128044": {
- "content": "<|reserved_special_token_36|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128045": {
- "content": "<|reserved_special_token_37|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128046": {
- "content": "<|reserved_special_token_38|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128047": {
- "content": "<|reserved_special_token_39|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128048": {
- "content": "<|reserved_special_token_40|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128049": {
- "content": "<|reserved_special_token_41|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128050": {
- "content": "<|reserved_special_token_42|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128051": {
- "content": "<|reserved_special_token_43|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128052": {
- "content": "<|reserved_special_token_44|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128053": {
- "content": "<|reserved_special_token_45|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128054": {
- "content": "<|reserved_special_token_46|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128055": {
- "content": "<|reserved_special_token_47|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128056": {
- "content": "<|reserved_special_token_48|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128057": {
- "content": "<|reserved_special_token_49|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128058": {
- "content": "<|reserved_special_token_50|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128059": {
- "content": "<|reserved_special_token_51|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128060": {
- "content": "<|reserved_special_token_52|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128061": {
- "content": "<|reserved_special_token_53|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128062": {
- "content": "<|reserved_special_token_54|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128063": {
- "content": "<|reserved_special_token_55|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128064": {
- "content": "<|reserved_special_token_56|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128065": {
- "content": "<|reserved_special_token_57|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128066": {
- "content": "<|reserved_special_token_58|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128067": {
- "content": "<|reserved_special_token_59|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128068": {
- "content": "<|reserved_special_token_60|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128069": {
- "content": "<|reserved_special_token_61|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128070": {
- "content": "<|reserved_special_token_62|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128071": {
- "content": "<|reserved_special_token_63|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128072": {
- "content": "<|reserved_special_token_64|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128073": {
- "content": "<|reserved_special_token_65|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128074": {
- "content": "<|reserved_special_token_66|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128075": {
- "content": "<|reserved_special_token_67|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128076": {
- "content": "<|reserved_special_token_68|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128077": {
- "content": "<|reserved_special_token_69|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128078": {
- "content": "<|reserved_special_token_70|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128079": {
- "content": "<|reserved_special_token_71|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128080": {
- "content": "<|reserved_special_token_72|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128081": {
- "content": "<|reserved_special_token_73|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128082": {
- "content": "<|reserved_special_token_74|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128083": {
- "content": "<|reserved_special_token_75|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128084": {
- "content": "<|reserved_special_token_76|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128085": {
- "content": "<|reserved_special_token_77|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128086": {
- "content": "<|reserved_special_token_78|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128087": {
- "content": "<|reserved_special_token_79|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128088": {
- "content": "<|reserved_special_token_80|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128089": {
- "content": "<|reserved_special_token_81|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128090": {
- "content": "<|reserved_special_token_82|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128091": {
- "content": "<|reserved_special_token_83|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128092": {
- "content": "<|reserved_special_token_84|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128093": {
- "content": "<|reserved_special_token_85|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128094": {
- "content": "<|reserved_special_token_86|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128095": {
- "content": "<|reserved_special_token_87|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128096": {
- "content": "<|reserved_special_token_88|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128097": {
- "content": "<|reserved_special_token_89|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128098": {
- "content": "<|reserved_special_token_90|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128099": {
- "content": "<|reserved_special_token_91|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128100": {
- "content": "<|reserved_special_token_92|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128101": {
- "content": "<|reserved_special_token_93|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128102": {
- "content": "<|reserved_special_token_94|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128103": {
- "content": "<|reserved_special_token_95|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128104": {
- "content": "<|reserved_special_token_96|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128105": {
- "content": "<|reserved_special_token_97|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128106": {
- "content": "<|reserved_special_token_98|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128107": {
- "content": "<|reserved_special_token_99|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128108": {
- "content": "<|reserved_special_token_100|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128109": {
- "content": "<|reserved_special_token_101|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128110": {
- "content": "<|reserved_special_token_102|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128111": {
- "content": "<|reserved_special_token_103|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128112": {
- "content": "<|reserved_special_token_104|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128113": {
- "content": "<|reserved_special_token_105|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128114": {
- "content": "<|reserved_special_token_106|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128115": {
- "content": "<|reserved_special_token_107|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128116": {
- "content": "<|reserved_special_token_108|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128117": {
- "content": "<|reserved_special_token_109|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128118": {
- "content": "<|reserved_special_token_110|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128119": {
- "content": "<|reserved_special_token_111|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128120": {
- "content": "<|reserved_special_token_112|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128121": {
- "content": "<|reserved_special_token_113|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128122": {
- "content": "<|reserved_special_token_114|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128123": {
- "content": "<|reserved_special_token_115|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128124": {
- "content": "<|reserved_special_token_116|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128125": {
- "content": "<|reserved_special_token_117|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128126": {
- "content": "<|reserved_special_token_118|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128127": {
- "content": "<|reserved_special_token_119|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128128": {
- "content": "<|reserved_special_token_120|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128129": {
- "content": "<|reserved_special_token_121|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128130": {
- "content": "<|reserved_special_token_122|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128131": {
- "content": "<|reserved_special_token_123|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128132": {
- "content": "<|reserved_special_token_124|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128133": {
- "content": "<|reserved_special_token_125|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128134": {
- "content": "<|reserved_special_token_126|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128135": {
- "content": "<|reserved_special_token_127|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128136": {
- "content": "<|reserved_special_token_128|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128137": {
- "content": "<|reserved_special_token_129|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128138": {
- "content": "<|reserved_special_token_130|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128139": {
- "content": "<|reserved_special_token_131|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128140": {
- "content": "<|reserved_special_token_132|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128141": {
- "content": "<|reserved_special_token_133|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128142": {
- "content": "<|reserved_special_token_134|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128143": {
- "content": "<|reserved_special_token_135|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128144": {
- "content": "<|reserved_special_token_136|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128145": {
- "content": "<|reserved_special_token_137|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128146": {
- "content": "<|reserved_special_token_138|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128147": {
- "content": "<|reserved_special_token_139|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128148": {
- "content": "<|reserved_special_token_140|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128149": {
- "content": "<|reserved_special_token_141|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128150": {
- "content": "<|reserved_special_token_142|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128151": {
- "content": "<|reserved_special_token_143|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128152": {
- "content": "<|reserved_special_token_144|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128153": {
- "content": "<|reserved_special_token_145|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128154": {
- "content": "<|reserved_special_token_146|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128155": {
- "content": "<|reserved_special_token_147|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128156": {
- "content": "<|reserved_special_token_148|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128157": {
- "content": "<|reserved_special_token_149|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128158": {
- "content": "<|reserved_special_token_150|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128159": {
- "content": "<|reserved_special_token_151|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128160": {
- "content": "<|reserved_special_token_152|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128161": {
- "content": "<|reserved_special_token_153|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128162": {
- "content": "<|reserved_special_token_154|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128163": {
- "content": "<|reserved_special_token_155|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128164": {
- "content": "<|reserved_special_token_156|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128165": {
- "content": "<|reserved_special_token_157|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128166": {
- "content": "<|reserved_special_token_158|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128167": {
- "content": "<|reserved_special_token_159|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128168": {
- "content": "<|reserved_special_token_160|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128169": {
- "content": "<|reserved_special_token_161|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128170": {
- "content": "<|reserved_special_token_162|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128171": {
- "content": "<|reserved_special_token_163|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128172": {
- "content": "<|reserved_special_token_164|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128173": {
- "content": "<|reserved_special_token_165|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128174": {
- "content": "<|reserved_special_token_166|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128175": {
- "content": "<|reserved_special_token_167|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128176": {
- "content": "<|reserved_special_token_168|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128177": {
- "content": "<|reserved_special_token_169|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128178": {
- "content": "<|reserved_special_token_170|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128179": {
- "content": "<|reserved_special_token_171|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128180": {
- "content": "<|reserved_special_token_172|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128181": {
- "content": "<|reserved_special_token_173|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128182": {
- "content": "<|reserved_special_token_174|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128183": {
- "content": "<|reserved_special_token_175|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128184": {
- "content": "<|reserved_special_token_176|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128185": {
- "content": "<|reserved_special_token_177|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128186": {
- "content": "<|reserved_special_token_178|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128187": {
- "content": "<|reserved_special_token_179|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128188": {
- "content": "<|reserved_special_token_180|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128189": {
- "content": "<|reserved_special_token_181|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128190": {
- "content": "<|reserved_special_token_182|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128191": {
- "content": "<|reserved_special_token_183|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128192": {
- "content": "<|reserved_special_token_184|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128193": {
- "content": "<|reserved_special_token_185|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128194": {
- "content": "<|reserved_special_token_186|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128195": {
- "content": "<|reserved_special_token_187|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128196": {
- "content": "<|reserved_special_token_188|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128197": {
- "content": "<|reserved_special_token_189|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128198": {
- "content": "<|reserved_special_token_190|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128199": {
- "content": "<|reserved_special_token_191|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128200": {
- "content": "<|reserved_special_token_192|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128201": {
- "content": "<|reserved_special_token_193|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128202": {
- "content": "<|reserved_special_token_194|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128203": {
- "content": "<|reserved_special_token_195|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128204": {
- "content": "<|reserved_special_token_196|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128205": {
- "content": "<|reserved_special_token_197|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128206": {
- "content": "<|reserved_special_token_198|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128207": {
- "content": "<|reserved_special_token_199|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128208": {
- "content": "<|reserved_special_token_200|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128209": {
- "content": "<|reserved_special_token_201|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128210": {
- "content": "<|reserved_special_token_202|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128211": {
- "content": "<|reserved_special_token_203|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128212": {
- "content": "<|reserved_special_token_204|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128213": {
- "content": "<|reserved_special_token_205|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128214": {
- "content": "<|reserved_special_token_206|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128215": {
- "content": "<|reserved_special_token_207|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128216": {
- "content": "<|reserved_special_token_208|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128217": {
- "content": "<|reserved_special_token_209|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128218": {
- "content": "<|reserved_special_token_210|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128219": {
- "content": "<|reserved_special_token_211|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128220": {
- "content": "<|reserved_special_token_212|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128221": {
- "content": "<|reserved_special_token_213|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128222": {
- "content": "<|reserved_special_token_214|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128223": {
- "content": "<|reserved_special_token_215|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128224": {
- "content": "<|reserved_special_token_216|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128225": {
- "content": "<|reserved_special_token_217|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128226": {
- "content": "<|reserved_special_token_218|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128227": {
- "content": "<|reserved_special_token_219|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128228": {
- "content": "<|reserved_special_token_220|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128229": {
- "content": "<|reserved_special_token_221|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128230": {
- "content": "<|reserved_special_token_222|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128231": {
- "content": "<|reserved_special_token_223|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128232": {
- "content": "<|reserved_special_token_224|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128233": {
- "content": "<|reserved_special_token_225|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128234": {
- "content": "<|reserved_special_token_226|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128235": {
- "content": "<|reserved_special_token_227|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128236": {
- "content": "<|reserved_special_token_228|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128237": {
- "content": "<|reserved_special_token_229|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128238": {
- "content": "<|reserved_special_token_230|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128239": {
- "content": "<|reserved_special_token_231|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128240": {
- "content": "<|reserved_special_token_232|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128241": {
- "content": "<|reserved_special_token_233|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128242": {
- "content": "<|reserved_special_token_234|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128243": {
- "content": "<|reserved_special_token_235|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128244": {
- "content": "<|reserved_special_token_236|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128245": {
- "content": "<|reserved_special_token_237|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128246": {
- "content": "<|reserved_special_token_238|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128247": {
- "content": "<|reserved_special_token_239|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128248": {
- "content": "<|reserved_special_token_240|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128249": {
- "content": "<|reserved_special_token_241|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128250": {
- "content": "<|reserved_special_token_242|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128251": {
- "content": "<|reserved_special_token_243|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128252": {
- "content": "<|reserved_special_token_244|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128253": {
- "content": "<|reserved_special_token_245|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128254": {
- "content": "<|reserved_special_token_246|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128255": {
- "content": "<|reserved_special_token_247|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- }
- },
- "bos_token": "<|begin_of_text|>",
- "clean_up_tokenization_spaces": true,
- "eos_token": "<|eot_id|>",
- "extra_special_tokens": {},
- "model_input_names": [
- "input_ids",
- "attention_mask"
- ],
- "model_max_length": 131072,
- "pad_token": "<|eot_id|>",
- "tokenizer_class": "PreTrainedTokenizerFast"
-}
diff --git a/checkpoint-400/trainer_state.json b/checkpoint-400/trainer_state.json
deleted file mode 100644
index 8536662e55d0228157dd159213a8d1ed7bf29eea..0000000000000000000000000000000000000000
--- a/checkpoint-400/trainer_state.json
+++ /dev/null
@@ -1,378 +0,0 @@
-{
- "best_global_step": 50,
- "best_metric": 0.7558398842811584,
- "best_model_checkpoint": null,
- "epoch": 40.0,
- "eval_steps": 50,
- "global_step": 400,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 1.0,
- "grad_norm": 1.4660576581954956,
- "learning_rate": 3.6e-05,
- "loss": 1.152,
- "step": 10
- },
- {
- "epoch": 2.0,
- "grad_norm": 0.8749533295631409,
- "learning_rate": 7.6e-05,
- "loss": 1.0421,
- "step": 20
- },
- {
- "epoch": 3.0,
- "grad_norm": 3.37060284614563,
- "learning_rate": 0.000116,
- "loss": 0.8539,
- "step": 30
- },
- {
- "epoch": 4.0,
- "grad_norm": 1.5355278253555298,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.5483,
- "step": 40
- },
- {
- "epoch": 5.0,
- "grad_norm": 2.454838514328003,
- "learning_rate": 0.000196,
- "loss": 0.3736,
- "step": 50
- },
- {
- "epoch": 5.0,
- "eval_loss": 0.7558398842811584,
- "eval_runtime": 1.7227,
- "eval_samples_per_second": 2.902,
- "eval_steps_per_second": 2.902,
- "step": 50
- },
- {
- "epoch": 6.0,
- "grad_norm": 3.676417827606201,
- "learning_rate": 0.000196,
- "loss": 0.2291,
- "step": 60
- },
- {
- "epoch": 7.0,
- "grad_norm": 2.192375898361206,
- "learning_rate": 0.00019155555555555554,
- "loss": 0.1244,
- "step": 70
- },
- {
- "epoch": 8.0,
- "grad_norm": 2.630005359649658,
- "learning_rate": 0.00018711111111111112,
- "loss": 0.0862,
- "step": 80
- },
- {
- "epoch": 9.0,
- "grad_norm": 0.5021786093711853,
- "learning_rate": 0.00018266666666666667,
- "loss": 0.0614,
- "step": 90
- },
- {
- "epoch": 10.0,
- "grad_norm": 0.38170942664146423,
- "learning_rate": 0.00017822222222222222,
- "loss": 0.0471,
- "step": 100
- },
- {
- "epoch": 10.0,
- "eval_loss": 0.8806974291801453,
- "eval_runtime": 1.7764,
- "eval_samples_per_second": 2.815,
- "eval_steps_per_second": 2.815,
- "step": 100
- },
- {
- "epoch": 11.0,
- "grad_norm": 1.223647952079773,
- "learning_rate": 0.0001737777777777778,
- "loss": 0.0359,
- "step": 110
- },
- {
- "epoch": 12.0,
- "grad_norm": 0.5452818870544434,
- "learning_rate": 0.00016933333333333335,
- "loss": 0.0289,
- "step": 120
- },
- {
- "epoch": 13.0,
- "grad_norm": 0.19034886360168457,
- "learning_rate": 0.0001648888888888889,
- "loss": 0.029,
- "step": 130
- },
- {
- "epoch": 14.0,
- "grad_norm": 0.7483140230178833,
- "learning_rate": 0.00016044444444444445,
- "loss": 0.0247,
- "step": 140
- },
- {
- "epoch": 15.0,
- "grad_norm": 0.34800082445144653,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.0193,
- "step": 150
- },
- {
- "epoch": 15.0,
- "eval_loss": 0.9916993379592896,
- "eval_runtime": 1.7667,
- "eval_samples_per_second": 2.83,
- "eval_steps_per_second": 2.83,
- "step": 150
- },
- {
- "epoch": 16.0,
- "grad_norm": 0.24237586557865143,
- "learning_rate": 0.00015155555555555557,
- "loss": 0.0176,
- "step": 160
- },
- {
- "epoch": 17.0,
- "grad_norm": 0.13607177138328552,
- "learning_rate": 0.00014711111111111112,
- "loss": 0.0131,
- "step": 170
- },
- {
- "epoch": 18.0,
- "grad_norm": 0.3655266761779785,
- "learning_rate": 0.00014266666666666667,
- "loss": 0.0164,
- "step": 180
- },
- {
- "epoch": 19.0,
- "grad_norm": 0.08258651196956635,
- "learning_rate": 0.00013822222222222222,
- "loss": 0.013,
- "step": 190
- },
- {
- "epoch": 20.0,
- "grad_norm": 0.1830163151025772,
- "learning_rate": 0.00013377777777777777,
- "loss": 0.0126,
- "step": 200
- },
- {
- "epoch": 20.0,
- "eval_loss": 1.0726474523544312,
- "eval_runtime": 1.7657,
- "eval_samples_per_second": 2.832,
- "eval_steps_per_second": 2.832,
- "step": 200
- },
- {
- "epoch": 21.0,
- "grad_norm": 0.12009257823228836,
- "learning_rate": 0.00012933333333333332,
- "loss": 0.0108,
- "step": 210
- },
- {
- "epoch": 22.0,
- "grad_norm": 0.1172371432185173,
- "learning_rate": 0.0001248888888888889,
- "loss": 0.0122,
- "step": 220
- },
- {
- "epoch": 23.0,
- "grad_norm": 0.14445751905441284,
- "learning_rate": 0.00012044444444444445,
- "loss": 0.0121,
- "step": 230
- },
- {
- "epoch": 24.0,
- "grad_norm": 0.18198293447494507,
- "learning_rate": 0.000116,
- "loss": 0.0128,
- "step": 240
- },
- {
- "epoch": 25.0,
- "grad_norm": 0.1562514454126358,
- "learning_rate": 0.00011155555555555556,
- "loss": 0.0117,
- "step": 250
- },
- {
- "epoch": 25.0,
- "eval_loss": 1.106227159500122,
- "eval_runtime": 1.7564,
- "eval_samples_per_second": 2.847,
- "eval_steps_per_second": 2.847,
- "step": 250
- },
- {
- "epoch": 26.0,
- "grad_norm": 0.06052432581782341,
- "learning_rate": 0.00010711111111111111,
- "loss": 0.0123,
- "step": 260
- },
- {
- "epoch": 27.0,
- "grad_norm": 0.03066837601363659,
- "learning_rate": 0.00010266666666666666,
- "loss": 0.0106,
- "step": 270
- },
- {
- "epoch": 28.0,
- "grad_norm": 0.034792304039001465,
- "learning_rate": 9.822222222222223e-05,
- "loss": 0.0124,
- "step": 280
- },
- {
- "epoch": 29.0,
- "grad_norm": 0.028368409723043442,
- "learning_rate": 9.377777777777779e-05,
- "loss": 0.0107,
- "step": 290
- },
- {
- "epoch": 30.0,
- "grad_norm": 0.03258921578526497,
- "learning_rate": 8.933333333333334e-05,
- "loss": 0.0109,
- "step": 300
- },
- {
- "epoch": 30.0,
- "eval_loss": 1.1306606531143188,
- "eval_runtime": 1.7675,
- "eval_samples_per_second": 2.829,
- "eval_steps_per_second": 2.829,
- "step": 300
- },
- {
- "epoch": 31.0,
- "grad_norm": 0.26905232667922974,
- "learning_rate": 8.488888888888889e-05,
- "loss": 0.0131,
- "step": 310
- },
- {
- "epoch": 32.0,
- "grad_norm": 0.15363195538520813,
- "learning_rate": 8.044444444444444e-05,
- "loss": 0.0121,
- "step": 320
- },
- {
- "epoch": 33.0,
- "grad_norm": 0.030869223177433014,
- "learning_rate": 7.6e-05,
- "loss": 0.0104,
- "step": 330
- },
- {
- "epoch": 34.0,
- "grad_norm": 0.07273676246404648,
- "learning_rate": 7.155555555555555e-05,
- "loss": 0.0112,
- "step": 340
- },
- {
- "epoch": 35.0,
- "grad_norm": 0.025629112496972084,
- "learning_rate": 6.711111111111112e-05,
- "loss": 0.0121,
- "step": 350
- },
- {
- "epoch": 35.0,
- "eval_loss": 1.128761887550354,
- "eval_runtime": 1.7518,
- "eval_samples_per_second": 2.854,
- "eval_steps_per_second": 2.854,
- "step": 350
- },
- {
- "epoch": 36.0,
- "grad_norm": 0.06929411739110947,
- "learning_rate": 6.266666666666667e-05,
- "loss": 0.0099,
- "step": 360
- },
- {
- "epoch": 37.0,
- "grad_norm": 0.102758027613163,
- "learning_rate": 5.8222222222222224e-05,
- "loss": 0.0096,
- "step": 370
- },
- {
- "epoch": 38.0,
- "grad_norm": 0.19261795282363892,
- "learning_rate": 5.377777777777778e-05,
- "loss": 0.0112,
- "step": 380
- },
- {
- "epoch": 39.0,
- "grad_norm": 0.23121486604213715,
- "learning_rate": 4.933333333333334e-05,
- "loss": 0.0117,
- "step": 390
- },
- {
- "epoch": 40.0,
- "grad_norm": 0.13266825675964355,
- "learning_rate": 4.4888888888888894e-05,
- "loss": 0.0113,
- "step": 400
- },
- {
- "epoch": 40.0,
- "eval_loss": 1.1694066524505615,
- "eval_runtime": 1.7708,
- "eval_samples_per_second": 2.824,
- "eval_steps_per_second": 2.824,
- "step": 400
- }
- ],
- "logging_steps": 10,
- "max_steps": 500,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 50,
- "save_steps": 100,
- "stateful_callbacks": {
- "TrainerControl": {
- "args": {
- "should_epoch_stop": false,
- "should_evaluate": false,
- "should_log": false,
- "should_save": true,
- "should_training_stop": false
- },
- "attributes": {}
- }
- },
- "total_flos": 5.310201565544448e+16,
- "train_batch_size": 1,
- "trial_name": null,
- "trial_params": null
-}
diff --git a/checkpoint-400/training_args.bin b/checkpoint-400/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/checkpoint-400/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777
diff --git a/checkpoint-500/README.md b/checkpoint-500/README.md
deleted file mode 100644
index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000
--- a/checkpoint-500/README.md
+++ /dev/null
@@ -1,207 +0,0 @@
----
-base_model: meta-llama/Llama-3.2-3B-Instruct
-library_name: peft
-pipeline_tag: text-generation
-tags:
-- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct
-- lora
-- transformers
----
-
-# Model Card for Model ID
-
-
-
-
-
-## Model Details
-
-### Model Description
-
-
-
-
-
-- **Developed by:** [More Information Needed]
-- **Funded by [optional]:** [More Information Needed]
-- **Shared by [optional]:** [More Information Needed]
-- **Model type:** [More Information Needed]
-- **Language(s) (NLP):** [More Information Needed]
-- **License:** [More Information Needed]
-- **Finetuned from model [optional]:** [More Information Needed]
-
-### Model Sources [optional]
-
-
-
-- **Repository:** [More Information Needed]
-- **Paper [optional]:** [More Information Needed]
-- **Demo [optional]:** [More Information Needed]
-
-## Uses
-
-
-
-### Direct Use
-
-
-
-[More Information Needed]
-
-### Downstream Use [optional]
-
-
-
-[More Information Needed]
-
-### Out-of-Scope Use
-
-
-
-[More Information Needed]
-
-## Bias, Risks, and Limitations
-
-
-
-[More Information Needed]
-
-### Recommendations
-
-
-
-Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
-
-## How to Get Started with the Model
-
-Use the code below to get started with the model.
-
-[More Information Needed]
-
-## Training Details
-
-### Training Data
-
-
-
-[More Information Needed]
-
-### Training Procedure
-
-
-
-#### Preprocessing [optional]
-
-[More Information Needed]
-
-
-#### Training Hyperparameters
-
-- **Training regime:** [More Information Needed]
-
-#### Speeds, Sizes, Times [optional]
-
-
-
-[More Information Needed]
-
-## Evaluation
-
-
-
-### Testing Data, Factors & Metrics
-
-#### Testing Data
-
-
-
-[More Information Needed]
-
-#### Factors
-
-
-
-[More Information Needed]
-
-#### Metrics
-
-
-
-[More Information Needed]
-
-### Results
-
-[More Information Needed]
-
-#### Summary
-
-
-
-## Model Examination [optional]
-
-
-
-[More Information Needed]
-
-## Environmental Impact
-
-
-
-Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
-
-- **Hardware Type:** [More Information Needed]
-- **Hours used:** [More Information Needed]
-- **Cloud Provider:** [More Information Needed]
-- **Compute Region:** [More Information Needed]
-- **Carbon Emitted:** [More Information Needed]
-
-## Technical Specifications [optional]
-
-### Model Architecture and Objective
-
-[More Information Needed]
-
-### Compute Infrastructure
-
-[More Information Needed]
-
-#### Hardware
-
-[More Information Needed]
-
-#### Software
-
-[More Information Needed]
-
-## Citation [optional]
-
-
-
-**BibTeX:**
-
-[More Information Needed]
-
-**APA:**
-
-[More Information Needed]
-
-## Glossary [optional]
-
-
-
-[More Information Needed]
-
-## More Information [optional]
-
-[More Information Needed]
-
-## Model Card Authors [optional]
-
-[More Information Needed]
-
-## Model Card Contact
-
-[More Information Needed]
-### Framework versions
-
-- PEFT 0.17.1
\ No newline at end of file
diff --git a/checkpoint-500/adapter_config.json b/checkpoint-500/adapter_config.json
deleted file mode 100644
index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000
--- a/checkpoint-500/adapter_config.json
+++ /dev/null
@@ -1,42 +0,0 @@
-{
- "alpha_pattern": {},
- "auto_mapping": null,
- "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct",
- "bias": "none",
- "corda_config": null,
- "eva_config": null,
- "exclude_modules": null,
- "fan_in_fan_out": false,
- "inference_mode": true,
- "init_lora_weights": true,
- "layer_replication": null,
- "layers_pattern": null,
- "layers_to_transform": null,
- "loftq_config": {},
- "lora_alpha": 32,
- "lora_bias": false,
- "lora_dropout": 0.1,
- "megatron_config": null,
- "megatron_core": "megatron.core",
- "modules_to_save": null,
- "peft_type": "LORA",
- "qalora_group_size": 16,
- "r": 16,
- "rank_pattern": {},
- "revision": null,
- "target_modules": [
- "down_proj",
- "v_proj",
- "q_proj",
- "k_proj",
- "gate_proj",
- "o_proj",
- "up_proj"
- ],
- "target_parameters": null,
- "task_type": "CAUSAL_LM",
- "trainable_token_indices": null,
- "use_dora": false,
- "use_qalora": false,
- "use_rslora": false
-}
\ No newline at end of file
diff --git a/checkpoint-500/adapter_model.safetensors b/checkpoint-500/adapter_model.safetensors
deleted file mode 100644
index 7a9846a96572118b10e28d68186ff4d9910f14c8..0000000000000000000000000000000000000000
--- a/checkpoint-500/adapter_model.safetensors
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f1267898d59499b11e00e1bb133bce956e6ae4d0f5e56bc474251ec2c869df0e
-size 97307544
diff --git a/checkpoint-500/chat_template.jinja b/checkpoint-500/chat_template.jinja
deleted file mode 100644
index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000
--- a/checkpoint-500/chat_template.jinja
+++ /dev/null
@@ -1,93 +0,0 @@
-{{- bos_token }}
-{%- if custom_tools is defined %}
- {%- set tools = custom_tools %}
-{%- endif %}
-{%- if not tools_in_user_message is defined %}
- {%- set tools_in_user_message = true %}
-{%- endif %}
-{%- if not date_string is defined %}
- {%- if strftime_now is defined %}
- {%- set date_string = strftime_now("%d %b %Y") %}
- {%- else %}
- {%- set date_string = "26 Jul 2024" %}
- {%- endif %}
-{%- endif %}
-{%- if not tools is defined %}
- {%- set tools = none %}
-{%- endif %}
-
-{#- This block extracts the system message, so we can slot it into the right place. #}
-{%- if messages[0]['role'] == 'system' %}
- {%- set system_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
-{%- else %}
- {%- set system_message = "" %}
-{%- endif %}
-
-{#- System message #}
-{{- "<|start_header_id|>system<|end_header_id|>\n\n" }}
-{%- if tools is not none %}
- {{- "Environment: ipython\n" }}
-{%- endif %}
-{{- "Cutting Knowledge Date: December 2023\n" }}
-{{- "Today Date: " + date_string + "\n\n" }}
-{%- if tools is not none and not tools_in_user_message %}
- {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
-{%- endif %}
-{{- system_message }}
-{{- "<|eot_id|>" }}
-
-{#- Custom tools are passed in a user message with some extra guidance #}
-{%- if tools_in_user_message and not tools is none %}
- {#- Extract the first user message so we can plug it in here #}
- {%- if messages | length != 0 %}
- {%- set first_user_message = messages[0]['content']|trim %}
- {%- set messages = messages[1:] %}
- {%- else %}
- {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }}
-{%- endif %}
- {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}
- {{- "Given the following functions, please respond with a JSON for a function call " }}
- {{- "with its proper arguments that best answers the given prompt.\n\n" }}
- {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }}
- {{- "Do not use variables.\n\n" }}
- {%- for t in tools %}
- {{- t | tojson(indent=4) }}
- {{- "\n\n" }}
- {%- endfor %}
- {{- first_user_message + "<|eot_id|>"}}
-{%- endif %}
-
-{%- for message in messages %}
- {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}
- {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}
- {%- elif 'tool_calls' in message %}
- {%- if not message.tool_calls|length == 1 %}
- {{- raise_exception("This model only supports single tool-calls at once!") }}
- {%- endif %}
- {%- set tool_call = message.tool_calls[0].function %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}
- {{- '{"name": "' + tool_call.name + '", ' }}
- {{- '"parameters": ' }}
- {{- tool_call.arguments | tojson }}
- {{- "}" }}
- {{- "<|eot_id|>" }}
- {%- elif message.role == "tool" or message.role == "ipython" %}
- {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }}
- {%- if message.content is mapping or message.content is iterable %}
- {{- message.content | tojson }}
- {%- else %}
- {{- message.content }}
- {%- endif %}
- {{- "<|eot_id|>" }}
- {%- endif %}
-{%- endfor %}
-{%- if add_generation_prompt %}
- {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}
-{%- endif %}
diff --git a/checkpoint-500/optimizer.pt b/checkpoint-500/optimizer.pt
deleted file mode 100644
index f7c2398a130ab9ffd8b90defabe5571440bc8cc1..0000000000000000000000000000000000000000
--- a/checkpoint-500/optimizer.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:364e4794f5e5265e6208ffb91534397b3f81c0ffd11eb1f70e677b82917cd811
-size 194846331
diff --git a/checkpoint-500/rng_state.pth b/checkpoint-500/rng_state.pth
deleted file mode 100644
index 1ba3c4495fdbd5b478e34246759af0e667a57976..0000000000000000000000000000000000000000
--- a/checkpoint-500/rng_state.pth
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cbf17c6ea5a2364f5c121447c9554bb3437ed12ac00bd180e0c39823e3932887
-size 14645
diff --git a/checkpoint-500/scaler.pt b/checkpoint-500/scaler.pt
deleted file mode 100644
index 86c857e8514e5db52a765434b135695dac4c9c36..0000000000000000000000000000000000000000
--- a/checkpoint-500/scaler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f77569c2e850b04af982cc8c1389f1430851448915c593b69e5da36ce05b71d7
-size 1383
diff --git a/checkpoint-500/scheduler.pt b/checkpoint-500/scheduler.pt
deleted file mode 100644
index 7d406056d4209a0bc88bb800efa5129731063e3b..0000000000000000000000000000000000000000
--- a/checkpoint-500/scheduler.pt
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:5fc3f7ed409df14d1c62e690e63b0c5e5d89499208bb0e61ef44ccedc3f1d40a
-size 1465
diff --git a/checkpoint-500/special_tokens_map.json b/checkpoint-500/special_tokens_map.json
deleted file mode 100644
index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000
--- a/checkpoint-500/special_tokens_map.json
+++ /dev/null
@@ -1,17 +0,0 @@
-{
- "bos_token": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "eos_token": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": "<|eot_id|>"
-}
diff --git a/checkpoint-500/tokenizer.json b/checkpoint-500/tokenizer.json
deleted file mode 100644
index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000
--- a/checkpoint-500/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09
-size 17210184
diff --git a/checkpoint-500/tokenizer_config.json b/checkpoint-500/tokenizer_config.json
deleted file mode 100644
index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000
--- a/checkpoint-500/tokenizer_config.json
+++ /dev/null
@@ -1,2063 +0,0 @@
-{
- "added_tokens_decoder": {
- "128000": {
- "content": "<|begin_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128001": {
- "content": "<|end_of_text|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128002": {
- "content": "<|reserved_special_token_0|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128003": {
- "content": "<|reserved_special_token_1|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128004": {
- "content": "<|finetune_right_pad_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128005": {
- "content": "<|reserved_special_token_2|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128006": {
- "content": "<|start_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128007": {
- "content": "<|end_header_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128008": {
- "content": "<|eom_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128009": {
- "content": "<|eot_id|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128010": {
- "content": "<|python_tag|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128011": {
- "content": "<|reserved_special_token_3|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128012": {
- "content": "<|reserved_special_token_4|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128013": {
- "content": "<|reserved_special_token_5|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128014": {
- "content": "<|reserved_special_token_6|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128015": {
- "content": "<|reserved_special_token_7|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128016": {
- "content": "<|reserved_special_token_8|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128017": {
- "content": "<|reserved_special_token_9|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128018": {
- "content": "<|reserved_special_token_10|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128019": {
- "content": "<|reserved_special_token_11|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128020": {
- "content": "<|reserved_special_token_12|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128021": {
- "content": "<|reserved_special_token_13|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128022": {
- "content": "<|reserved_special_token_14|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128023": {
- "content": "<|reserved_special_token_15|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128024": {
- "content": "<|reserved_special_token_16|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128025": {
- "content": "<|reserved_special_token_17|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128026": {
- "content": "<|reserved_special_token_18|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128027": {
- "content": "<|reserved_special_token_19|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128028": {
- "content": "<|reserved_special_token_20|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128029": {
- "content": "<|reserved_special_token_21|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128030": {
- "content": "<|reserved_special_token_22|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128031": {
- "content": "<|reserved_special_token_23|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128032": {
- "content": "<|reserved_special_token_24|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128033": {
- "content": "<|reserved_special_token_25|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128034": {
- "content": "<|reserved_special_token_26|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128035": {
- "content": "<|reserved_special_token_27|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128036": {
- "content": "<|reserved_special_token_28|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128037": {
- "content": "<|reserved_special_token_29|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128038": {
- "content": "<|reserved_special_token_30|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128039": {
- "content": "<|reserved_special_token_31|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128040": {
- "content": "<|reserved_special_token_32|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128041": {
- "content": "<|reserved_special_token_33|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128042": {
- "content": "<|reserved_special_token_34|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128043": {
- "content": "<|reserved_special_token_35|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128044": {
- "content": "<|reserved_special_token_36|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128045": {
- "content": "<|reserved_special_token_37|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128046": {
- "content": "<|reserved_special_token_38|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128047": {
- "content": "<|reserved_special_token_39|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128048": {
- "content": "<|reserved_special_token_40|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128049": {
- "content": "<|reserved_special_token_41|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128050": {
- "content": "<|reserved_special_token_42|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128051": {
- "content": "<|reserved_special_token_43|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128052": {
- "content": "<|reserved_special_token_44|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128053": {
- "content": "<|reserved_special_token_45|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128054": {
- "content": "<|reserved_special_token_46|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128055": {
- "content": "<|reserved_special_token_47|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128056": {
- "content": "<|reserved_special_token_48|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128057": {
- "content": "<|reserved_special_token_49|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128058": {
- "content": "<|reserved_special_token_50|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128059": {
- "content": "<|reserved_special_token_51|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128060": {
- "content": "<|reserved_special_token_52|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128061": {
- "content": "<|reserved_special_token_53|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128062": {
- "content": "<|reserved_special_token_54|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128063": {
- "content": "<|reserved_special_token_55|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128064": {
- "content": "<|reserved_special_token_56|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128065": {
- "content": "<|reserved_special_token_57|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128066": {
- "content": "<|reserved_special_token_58|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128067": {
- "content": "<|reserved_special_token_59|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128068": {
- "content": "<|reserved_special_token_60|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128069": {
- "content": "<|reserved_special_token_61|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128070": {
- "content": "<|reserved_special_token_62|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128071": {
- "content": "<|reserved_special_token_63|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128072": {
- "content": "<|reserved_special_token_64|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128073": {
- "content": "<|reserved_special_token_65|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128074": {
- "content": "<|reserved_special_token_66|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128075": {
- "content": "<|reserved_special_token_67|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128076": {
- "content": "<|reserved_special_token_68|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128077": {
- "content": "<|reserved_special_token_69|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128078": {
- "content": "<|reserved_special_token_70|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128079": {
- "content": "<|reserved_special_token_71|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128080": {
- "content": "<|reserved_special_token_72|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128081": {
- "content": "<|reserved_special_token_73|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128082": {
- "content": "<|reserved_special_token_74|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128083": {
- "content": "<|reserved_special_token_75|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128084": {
- "content": "<|reserved_special_token_76|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128085": {
- "content": "<|reserved_special_token_77|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128086": {
- "content": "<|reserved_special_token_78|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128087": {
- "content": "<|reserved_special_token_79|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128088": {
- "content": "<|reserved_special_token_80|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128089": {
- "content": "<|reserved_special_token_81|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128090": {
- "content": "<|reserved_special_token_82|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128091": {
- "content": "<|reserved_special_token_83|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128092": {
- "content": "<|reserved_special_token_84|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128093": {
- "content": "<|reserved_special_token_85|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128094": {
- "content": "<|reserved_special_token_86|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128095": {
- "content": "<|reserved_special_token_87|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128096": {
- "content": "<|reserved_special_token_88|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128097": {
- "content": "<|reserved_special_token_89|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128098": {
- "content": "<|reserved_special_token_90|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128099": {
- "content": "<|reserved_special_token_91|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128100": {
- "content": "<|reserved_special_token_92|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128101": {
- "content": "<|reserved_special_token_93|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128102": {
- "content": "<|reserved_special_token_94|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128103": {
- "content": "<|reserved_special_token_95|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128104": {
- "content": "<|reserved_special_token_96|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128105": {
- "content": "<|reserved_special_token_97|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128106": {
- "content": "<|reserved_special_token_98|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128107": {
- "content": "<|reserved_special_token_99|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128108": {
- "content": "<|reserved_special_token_100|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128109": {
- "content": "<|reserved_special_token_101|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128110": {
- "content": "<|reserved_special_token_102|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128111": {
- "content": "<|reserved_special_token_103|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128112": {
- "content": "<|reserved_special_token_104|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128113": {
- "content": "<|reserved_special_token_105|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128114": {
- "content": "<|reserved_special_token_106|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128115": {
- "content": "<|reserved_special_token_107|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128116": {
- "content": "<|reserved_special_token_108|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128117": {
- "content": "<|reserved_special_token_109|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128118": {
- "content": "<|reserved_special_token_110|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128119": {
- "content": "<|reserved_special_token_111|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128120": {
- "content": "<|reserved_special_token_112|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128121": {
- "content": "<|reserved_special_token_113|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128122": {
- "content": "<|reserved_special_token_114|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128123": {
- "content": "<|reserved_special_token_115|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128124": {
- "content": "<|reserved_special_token_116|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128125": {
- "content": "<|reserved_special_token_117|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128126": {
- "content": "<|reserved_special_token_118|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128127": {
- "content": "<|reserved_special_token_119|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128128": {
- "content": "<|reserved_special_token_120|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128129": {
- "content": "<|reserved_special_token_121|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128130": {
- "content": "<|reserved_special_token_122|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128131": {
- "content": "<|reserved_special_token_123|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128132": {
- "content": "<|reserved_special_token_124|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128133": {
- "content": "<|reserved_special_token_125|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128134": {
- "content": "<|reserved_special_token_126|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128135": {
- "content": "<|reserved_special_token_127|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128136": {
- "content": "<|reserved_special_token_128|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128137": {
- "content": "<|reserved_special_token_129|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128138": {
- "content": "<|reserved_special_token_130|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128139": {
- "content": "<|reserved_special_token_131|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128140": {
- "content": "<|reserved_special_token_132|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128141": {
- "content": "<|reserved_special_token_133|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128142": {
- "content": "<|reserved_special_token_134|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128143": {
- "content": "<|reserved_special_token_135|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128144": {
- "content": "<|reserved_special_token_136|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128145": {
- "content": "<|reserved_special_token_137|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128146": {
- "content": "<|reserved_special_token_138|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128147": {
- "content": "<|reserved_special_token_139|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128148": {
- "content": "<|reserved_special_token_140|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128149": {
- "content": "<|reserved_special_token_141|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128150": {
- "content": "<|reserved_special_token_142|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128151": {
- "content": "<|reserved_special_token_143|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128152": {
- "content": "<|reserved_special_token_144|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128153": {
- "content": "<|reserved_special_token_145|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128154": {
- "content": "<|reserved_special_token_146|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128155": {
- "content": "<|reserved_special_token_147|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128156": {
- "content": "<|reserved_special_token_148|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128157": {
- "content": "<|reserved_special_token_149|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128158": {
- "content": "<|reserved_special_token_150|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128159": {
- "content": "<|reserved_special_token_151|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128160": {
- "content": "<|reserved_special_token_152|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128161": {
- "content": "<|reserved_special_token_153|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128162": {
- "content": "<|reserved_special_token_154|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128163": {
- "content": "<|reserved_special_token_155|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128164": {
- "content": "<|reserved_special_token_156|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128165": {
- "content": "<|reserved_special_token_157|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128166": {
- "content": "<|reserved_special_token_158|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128167": {
- "content": "<|reserved_special_token_159|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128168": {
- "content": "<|reserved_special_token_160|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128169": {
- "content": "<|reserved_special_token_161|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128170": {
- "content": "<|reserved_special_token_162|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128171": {
- "content": "<|reserved_special_token_163|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128172": {
- "content": "<|reserved_special_token_164|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128173": {
- "content": "<|reserved_special_token_165|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128174": {
- "content": "<|reserved_special_token_166|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128175": {
- "content": "<|reserved_special_token_167|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128176": {
- "content": "<|reserved_special_token_168|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128177": {
- "content": "<|reserved_special_token_169|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128178": {
- "content": "<|reserved_special_token_170|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128179": {
- "content": "<|reserved_special_token_171|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128180": {
- "content": "<|reserved_special_token_172|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128181": {
- "content": "<|reserved_special_token_173|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128182": {
- "content": "<|reserved_special_token_174|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128183": {
- "content": "<|reserved_special_token_175|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128184": {
- "content": "<|reserved_special_token_176|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128185": {
- "content": "<|reserved_special_token_177|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128186": {
- "content": "<|reserved_special_token_178|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128187": {
- "content": "<|reserved_special_token_179|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128188": {
- "content": "<|reserved_special_token_180|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128189": {
- "content": "<|reserved_special_token_181|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128190": {
- "content": "<|reserved_special_token_182|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128191": {
- "content": "<|reserved_special_token_183|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128192": {
- "content": "<|reserved_special_token_184|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128193": {
- "content": "<|reserved_special_token_185|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128194": {
- "content": "<|reserved_special_token_186|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128195": {
- "content": "<|reserved_special_token_187|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128196": {
- "content": "<|reserved_special_token_188|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128197": {
- "content": "<|reserved_special_token_189|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128198": {
- "content": "<|reserved_special_token_190|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128199": {
- "content": "<|reserved_special_token_191|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128200": {
- "content": "<|reserved_special_token_192|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128201": {
- "content": "<|reserved_special_token_193|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128202": {
- "content": "<|reserved_special_token_194|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128203": {
- "content": "<|reserved_special_token_195|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128204": {
- "content": "<|reserved_special_token_196|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128205": {
- "content": "<|reserved_special_token_197|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128206": {
- "content": "<|reserved_special_token_198|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128207": {
- "content": "<|reserved_special_token_199|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128208": {
- "content": "<|reserved_special_token_200|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128209": {
- "content": "<|reserved_special_token_201|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128210": {
- "content": "<|reserved_special_token_202|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128211": {
- "content": "<|reserved_special_token_203|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128212": {
- "content": "<|reserved_special_token_204|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128213": {
- "content": "<|reserved_special_token_205|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128214": {
- "content": "<|reserved_special_token_206|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128215": {
- "content": "<|reserved_special_token_207|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128216": {
- "content": "<|reserved_special_token_208|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128217": {
- "content": "<|reserved_special_token_209|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128218": {
- "content": "<|reserved_special_token_210|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128219": {
- "content": "<|reserved_special_token_211|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128220": {
- "content": "<|reserved_special_token_212|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128221": {
- "content": "<|reserved_special_token_213|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128222": {
- "content": "<|reserved_special_token_214|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128223": {
- "content": "<|reserved_special_token_215|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128224": {
- "content": "<|reserved_special_token_216|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128225": {
- "content": "<|reserved_special_token_217|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128226": {
- "content": "<|reserved_special_token_218|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128227": {
- "content": "<|reserved_special_token_219|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128228": {
- "content": "<|reserved_special_token_220|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128229": {
- "content": "<|reserved_special_token_221|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128230": {
- "content": "<|reserved_special_token_222|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128231": {
- "content": "<|reserved_special_token_223|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128232": {
- "content": "<|reserved_special_token_224|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128233": {
- "content": "<|reserved_special_token_225|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128234": {
- "content": "<|reserved_special_token_226|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128235": {
- "content": "<|reserved_special_token_227|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128236": {
- "content": "<|reserved_special_token_228|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128237": {
- "content": "<|reserved_special_token_229|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128238": {
- "content": "<|reserved_special_token_230|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128239": {
- "content": "<|reserved_special_token_231|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128240": {
- "content": "<|reserved_special_token_232|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128241": {
- "content": "<|reserved_special_token_233|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128242": {
- "content": "<|reserved_special_token_234|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128243": {
- "content": "<|reserved_special_token_235|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128244": {
- "content": "<|reserved_special_token_236|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128245": {
- "content": "<|reserved_special_token_237|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128246": {
- "content": "<|reserved_special_token_238|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128247": {
- "content": "<|reserved_special_token_239|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128248": {
- "content": "<|reserved_special_token_240|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128249": {
- "content": "<|reserved_special_token_241|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128250": {
- "content": "<|reserved_special_token_242|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128251": {
- "content": "<|reserved_special_token_243|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128252": {
- "content": "<|reserved_special_token_244|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128253": {
- "content": "<|reserved_special_token_245|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128254": {
- "content": "<|reserved_special_token_246|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "128255": {
- "content": "<|reserved_special_token_247|>",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- }
- },
- "bos_token": "<|begin_of_text|>",
- "clean_up_tokenization_spaces": true,
- "eos_token": "<|eot_id|>",
- "extra_special_tokens": {},
- "model_input_names": [
- "input_ids",
- "attention_mask"
- ],
- "model_max_length": 131072,
- "pad_token": "<|eot_id|>",
- "tokenizer_class": "PreTrainedTokenizerFast"
-}
diff --git a/checkpoint-500/trainer_state.json b/checkpoint-500/trainer_state.json
deleted file mode 100644
index ad1084b0a242485512b68bd91bce462e02c2d094..0000000000000000000000000000000000000000
--- a/checkpoint-500/trainer_state.json
+++ /dev/null
@@ -1,464 +0,0 @@
-{
- "best_global_step": 50,
- "best_metric": 0.7558398842811584,
- "best_model_checkpoint": null,
- "epoch": 50.0,
- "eval_steps": 50,
- "global_step": 500,
- "is_hyper_param_search": false,
- "is_local_process_zero": true,
- "is_world_process_zero": true,
- "log_history": [
- {
- "epoch": 1.0,
- "grad_norm": 1.4660576581954956,
- "learning_rate": 3.6e-05,
- "loss": 1.152,
- "step": 10
- },
- {
- "epoch": 2.0,
- "grad_norm": 0.8749533295631409,
- "learning_rate": 7.6e-05,
- "loss": 1.0421,
- "step": 20
- },
- {
- "epoch": 3.0,
- "grad_norm": 3.37060284614563,
- "learning_rate": 0.000116,
- "loss": 0.8539,
- "step": 30
- },
- {
- "epoch": 4.0,
- "grad_norm": 1.5355278253555298,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.5483,
- "step": 40
- },
- {
- "epoch": 5.0,
- "grad_norm": 2.454838514328003,
- "learning_rate": 0.000196,
- "loss": 0.3736,
- "step": 50
- },
- {
- "epoch": 5.0,
- "eval_loss": 0.7558398842811584,
- "eval_runtime": 1.7227,
- "eval_samples_per_second": 2.902,
- "eval_steps_per_second": 2.902,
- "step": 50
- },
- {
- "epoch": 6.0,
- "grad_norm": 3.676417827606201,
- "learning_rate": 0.000196,
- "loss": 0.2291,
- "step": 60
- },
- {
- "epoch": 7.0,
- "grad_norm": 2.192375898361206,
- "learning_rate": 0.00019155555555555554,
- "loss": 0.1244,
- "step": 70
- },
- {
- "epoch": 8.0,
- "grad_norm": 2.630005359649658,
- "learning_rate": 0.00018711111111111112,
- "loss": 0.0862,
- "step": 80
- },
- {
- "epoch": 9.0,
- "grad_norm": 0.5021786093711853,
- "learning_rate": 0.00018266666666666667,
- "loss": 0.0614,
- "step": 90
- },
- {
- "epoch": 10.0,
- "grad_norm": 0.38170942664146423,
- "learning_rate": 0.00017822222222222222,
- "loss": 0.0471,
- "step": 100
- },
- {
- "epoch": 10.0,
- "eval_loss": 0.8806974291801453,
- "eval_runtime": 1.7764,
- "eval_samples_per_second": 2.815,
- "eval_steps_per_second": 2.815,
- "step": 100
- },
- {
- "epoch": 11.0,
- "grad_norm": 1.223647952079773,
- "learning_rate": 0.0001737777777777778,
- "loss": 0.0359,
- "step": 110
- },
- {
- "epoch": 12.0,
- "grad_norm": 0.5452818870544434,
- "learning_rate": 0.00016933333333333335,
- "loss": 0.0289,
- "step": 120
- },
- {
- "epoch": 13.0,
- "grad_norm": 0.19034886360168457,
- "learning_rate": 0.0001648888888888889,
- "loss": 0.029,
- "step": 130
- },
- {
- "epoch": 14.0,
- "grad_norm": 0.7483140230178833,
- "learning_rate": 0.00016044444444444445,
- "loss": 0.0247,
- "step": 140
- },
- {
- "epoch": 15.0,
- "grad_norm": 0.34800082445144653,
- "learning_rate": 0.00015600000000000002,
- "loss": 0.0193,
- "step": 150
- },
- {
- "epoch": 15.0,
- "eval_loss": 0.9916993379592896,
- "eval_runtime": 1.7667,
- "eval_samples_per_second": 2.83,
- "eval_steps_per_second": 2.83,
- "step": 150
- },
- {
- "epoch": 16.0,
- "grad_norm": 0.24237586557865143,
- "learning_rate": 0.00015155555555555557,
- "loss": 0.0176,
- "step": 160
- },
- {
- "epoch": 17.0,
- "grad_norm": 0.13607177138328552,
- "learning_rate": 0.00014711111111111112,
- "loss": 0.0131,
- "step": 170
- },
- {
- "epoch": 18.0,
- "grad_norm": 0.3655266761779785,
- "learning_rate": 0.00014266666666666667,
- "loss": 0.0164,
- "step": 180
- },
- {
- "epoch": 19.0,
- "grad_norm": 0.08258651196956635,
- "learning_rate": 0.00013822222222222222,
- "loss": 0.013,
- "step": 190
- },
- {
- "epoch": 20.0,
- "grad_norm": 0.1830163151025772,
- "learning_rate": 0.00013377777777777777,
- "loss": 0.0126,
- "step": 200
- },
- {
- "epoch": 20.0,
- "eval_loss": 1.0726474523544312,
- "eval_runtime": 1.7657,
- "eval_samples_per_second": 2.832,
- "eval_steps_per_second": 2.832,
- "step": 200
- },
- {
- "epoch": 21.0,
- "grad_norm": 0.12009257823228836,
- "learning_rate": 0.00012933333333333332,
- "loss": 0.0108,
- "step": 210
- },
- {
- "epoch": 22.0,
- "grad_norm": 0.1172371432185173,
- "learning_rate": 0.0001248888888888889,
- "loss": 0.0122,
- "step": 220
- },
- {
- "epoch": 23.0,
- "grad_norm": 0.14445751905441284,
- "learning_rate": 0.00012044444444444445,
- "loss": 0.0121,
- "step": 230
- },
- {
- "epoch": 24.0,
- "grad_norm": 0.18198293447494507,
- "learning_rate": 0.000116,
- "loss": 0.0128,
- "step": 240
- },
- {
- "epoch": 25.0,
- "grad_norm": 0.1562514454126358,
- "learning_rate": 0.00011155555555555556,
- "loss": 0.0117,
- "step": 250
- },
- {
- "epoch": 25.0,
- "eval_loss": 1.106227159500122,
- "eval_runtime": 1.7564,
- "eval_samples_per_second": 2.847,
- "eval_steps_per_second": 2.847,
- "step": 250
- },
- {
- "epoch": 26.0,
- "grad_norm": 0.06052432581782341,
- "learning_rate": 0.00010711111111111111,
- "loss": 0.0123,
- "step": 260
- },
- {
- "epoch": 27.0,
- "grad_norm": 0.03066837601363659,
- "learning_rate": 0.00010266666666666666,
- "loss": 0.0106,
- "step": 270
- },
- {
- "epoch": 28.0,
- "grad_norm": 0.034792304039001465,
- "learning_rate": 9.822222222222223e-05,
- "loss": 0.0124,
- "step": 280
- },
- {
- "epoch": 29.0,
- "grad_norm": 0.028368409723043442,
- "learning_rate": 9.377777777777779e-05,
- "loss": 0.0107,
- "step": 290
- },
- {
- "epoch": 30.0,
- "grad_norm": 0.03258921578526497,
- "learning_rate": 8.933333333333334e-05,
- "loss": 0.0109,
- "step": 300
- },
- {
- "epoch": 30.0,
- "eval_loss": 1.1306606531143188,
- "eval_runtime": 1.7675,
- "eval_samples_per_second": 2.829,
- "eval_steps_per_second": 2.829,
- "step": 300
- },
- {
- "epoch": 31.0,
- "grad_norm": 0.26905232667922974,
- "learning_rate": 8.488888888888889e-05,
- "loss": 0.0131,
- "step": 310
- },
- {
- "epoch": 32.0,
- "grad_norm": 0.15363195538520813,
- "learning_rate": 8.044444444444444e-05,
- "loss": 0.0121,
- "step": 320
- },
- {
- "epoch": 33.0,
- "grad_norm": 0.030869223177433014,
- "learning_rate": 7.6e-05,
- "loss": 0.0104,
- "step": 330
- },
- {
- "epoch": 34.0,
- "grad_norm": 0.07273676246404648,
- "learning_rate": 7.155555555555555e-05,
- "loss": 0.0112,
- "step": 340
- },
- {
- "epoch": 35.0,
- "grad_norm": 0.025629112496972084,
- "learning_rate": 6.711111111111112e-05,
- "loss": 0.0121,
- "step": 350
- },
- {
- "epoch": 35.0,
- "eval_loss": 1.128761887550354,
- "eval_runtime": 1.7518,
- "eval_samples_per_second": 2.854,
- "eval_steps_per_second": 2.854,
- "step": 350
- },
- {
- "epoch": 36.0,
- "grad_norm": 0.06929411739110947,
- "learning_rate": 6.266666666666667e-05,
- "loss": 0.0099,
- "step": 360
- },
- {
- "epoch": 37.0,
- "grad_norm": 0.102758027613163,
- "learning_rate": 5.8222222222222224e-05,
- "loss": 0.0096,
- "step": 370
- },
- {
- "epoch": 38.0,
- "grad_norm": 0.19261795282363892,
- "learning_rate": 5.377777777777778e-05,
- "loss": 0.0112,
- "step": 380
- },
- {
- "epoch": 39.0,
- "grad_norm": 0.23121486604213715,
- "learning_rate": 4.933333333333334e-05,
- "loss": 0.0117,
- "step": 390
- },
- {
- "epoch": 40.0,
- "grad_norm": 0.13266825675964355,
- "learning_rate": 4.4888888888888894e-05,
- "loss": 0.0113,
- "step": 400
- },
- {
- "epoch": 40.0,
- "eval_loss": 1.1694066524505615,
- "eval_runtime": 1.7708,
- "eval_samples_per_second": 2.824,
- "eval_steps_per_second": 2.824,
- "step": 400
- },
- {
- "epoch": 41.0,
- "grad_norm": 0.17276649177074432,
- "learning_rate": 4.0444444444444444e-05,
- "loss": 0.0103,
- "step": 410
- },
- {
- "epoch": 42.0,
- "grad_norm": 0.13706862926483154,
- "learning_rate": 3.6e-05,
- "loss": 0.0115,
- "step": 420
- },
- {
- "epoch": 43.0,
- "grad_norm": 0.1022062748670578,
- "learning_rate": 3.155555555555556e-05,
- "loss": 0.0118,
- "step": 430
- },
- {
- "epoch": 44.0,
- "grad_norm": 0.11416096985340118,
- "learning_rate": 2.7111111111111114e-05,
- "loss": 0.0096,
- "step": 440
- },
- {
- "epoch": 45.0,
- "grad_norm": 0.14480136334896088,
- "learning_rate": 2.2666666666666668e-05,
- "loss": 0.0093,
- "step": 450
- },
- {
- "epoch": 45.0,
- "eval_loss": 1.1621501445770264,
- "eval_runtime": 1.7753,
- "eval_samples_per_second": 2.816,
- "eval_steps_per_second": 2.816,
- "step": 450
- },
- {
- "epoch": 46.0,
- "grad_norm": 0.1180804893374443,
- "learning_rate": 1.8222222222222224e-05,
- "loss": 0.0126,
- "step": 460
- },
- {
- "epoch": 47.0,
- "grad_norm": 0.05086653307080269,
- "learning_rate": 1.3777777777777778e-05,
- "loss": 0.0111,
- "step": 470
- },
- {
- "epoch": 48.0,
- "grad_norm": 0.032583802938461304,
- "learning_rate": 9.333333333333334e-06,
- "loss": 0.0094,
- "step": 480
- },
- {
- "epoch": 49.0,
- "grad_norm": 0.04545021802186966,
- "learning_rate": 4.888888888888889e-06,
- "loss": 0.0117,
- "step": 490
- },
- {
- "epoch": 50.0,
- "grad_norm": 0.05125224590301514,
- "learning_rate": 4.444444444444445e-07,
- "loss": 0.0105,
- "step": 500
- },
- {
- "epoch": 50.0,
- "eval_loss": 1.169873833656311,
- "eval_runtime": 1.7599,
- "eval_samples_per_second": 2.841,
- "eval_steps_per_second": 2.841,
- "step": 500
- }
- ],
- "logging_steps": 10,
- "max_steps": 500,
- "num_input_tokens_seen": 0,
- "num_train_epochs": 50,
- "save_steps": 100,
- "stateful_callbacks": {
- "TrainerControl": {
- "args": {
- "should_epoch_stop": false,
- "should_evaluate": false,
- "should_log": false,
- "should_save": true,
- "should_training_stop": true
- },
- "attributes": {}
- }
- },
- "total_flos": 6.63775195693056e+16,
- "train_batch_size": 1,
- "trial_name": null,
- "trial_params": null
-}
diff --git a/checkpoint-500/training_args.bin b/checkpoint-500/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/checkpoint-500/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777
diff --git a/special_tokens_map.json b/special_tokens_map.json
deleted file mode 100644
index b90a4f3ca8530c09c5723f153257607c6fdabefc..0000000000000000000000000000000000000000
--- a/special_tokens_map.json
+++ /dev/null
@@ -1,40 +0,0 @@
-{
- "additional_special_tokens": [
- "▁
",
- "▁",
- "▁",
- "▁",
- "▁",
- "▁",
- "▁",
- "▁"
- ],
- "bos_token": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "eos_token": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "pad_token": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- },
- "unk_token": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false
- }
-}
diff --git a/tokenizer.json b/tokenizer.json
deleted file mode 100644
index fa5d179a4294feaa4747648098eaacd84fae3b98..0000000000000000000000000000000000000000
--- a/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3db85ad6e5063687453d32b28de462a4fc7c6809c38c1b45326e2efe6e6fbee6
-size 3620984
diff --git a/tokenizer_config.json b/tokenizer_config.json
deleted file mode 100644
index f47206bd85c500c1451b5821065dfc19e7fc2372..0000000000000000000000000000000000000000
--- a/tokenizer_config.json
+++ /dev/null
@@ -1,95 +0,0 @@
-{
- "add_bos_token": true,
- "add_eos_token": false,
- "added_tokens_decoder": {
- "0": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "1": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "2": {
- "content": "",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "32007": {
- "content": "▁",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "32008": {
- "content": "▁",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "32009": {
- "content": "▁",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- },
- "32010": {
- "content": "▁",
- "lstrip": false,
- "normalized": false,
- "rstrip": false,
- "single_word": false,
- "special": true
- }
- },
- "additional_special_tokens": [
- "▁",
- "▁",
- "▁",
- "▁",
- "▁",
- "▁",
- "▁",
- "▁"
- ],
- "bos_token": "",
- "clean_up_tokenization_spaces": false,
- "eos_token": "",
- "eot_token": "▁",
- "extra_special_tokens": {},
- "fill_token": "",
- "legacy": null,
- "max_length": 2048,
- "middle_token": "▁",
- "model_max_length": 1000000000000000019884624838656,
- "pad_to_multiple_of": null,
- "pad_token": "",
- "pad_token_type_id": 0,
- "padding_side": "right",
- "prefix_token": "▁",
- "sp_model_kwargs": {},
- "stride": 0,
- "suffix_token": "▁",
- "tokenizer_class": "CodeLlamaTokenizerFast",
- "truncation_side": "right",
- "truncation_strategy": "longest_first",
- "unk_token": "",
- "use_default_system_prompt": false
-}
diff --git a/training_args.bin b/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777