diff --git a/13B-ollama/anysecret-assistant-13B-Q4_K_M.gguf b/13B-ollama/anysecret-assistant-13B-Q4_K_M.gguf deleted file mode 100644 index 1989cfc6c3c4f52887e58fa6ca4fcd66f5814171..0000000000000000000000000000000000000000 --- a/13B-ollama/anysecret-assistant-13B-Q4_K_M.gguf +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f635699554afee39a40c05ddd8f9dc35ecfc9b31c754d6849c805d98128d3641 -size 7866071424 diff --git a/13B-ollama/anysecret-assistant-13B-Q5_K_M.gguf b/13B-ollama/anysecret-assistant-13B-Q5_K_M.gguf deleted file mode 100644 index 26b0b975dfdd66f87410a3a45fbed04114ebca9f..0000000000000000000000000000000000000000 --- a/13B-ollama/anysecret-assistant-13B-Q5_K_M.gguf +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ca7857afe8908510859f7f6fe18232a1efa93fe7dac0e6b0c177b2f6895fe5df -size 9230049664 diff --git a/13B-ollama/anysecret-assistant-13B-Q8_0.gguf b/13B-ollama/anysecret-assistant-13B-Q8_0.gguf deleted file mode 100644 index 1921ad47a2bf21bc298e9752917b2145391f58a3..0000000000000000000000000000000000000000 --- a/13B-ollama/anysecret-assistant-13B-Q8_0.gguf +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7c1c6ffab8eb447d2da08ce7cb2f70c398d9dd69ea509ae6f1f98aad33c410b6 -size 13831495424 diff --git a/adapter_config.json b/adapter_config.json deleted file mode 100644 index 2a47c2409fcec449ecdbcdde4b38627e50b56a0b..0000000000000000000000000000000000000000 --- a/adapter_config.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "alpha_pattern": {}, - "auto_mapping": null, - "base_model_name_or_path": "codellama/CodeLlama-13b-Instruct-hf", - "bias": "none", - "corda_config": null, - "eva_config": null, - "exclude_modules": null, - "fan_in_fan_out": false, - "inference_mode": true, - "init_lora_weights": true, - "layer_replication": null, - "layers_pattern": null, - "layers_to_transform": null, - "loftq_config": {}, - "lora_alpha": 32, - "lora_bias": false, - "lora_dropout": 0.1, - "megatron_config": null, - "megatron_core": "megatron.core", - "modules_to_save": null, - "peft_type": "LORA", - "qalora_group_size": 16, - "r": 16, - "rank_pattern": {}, - "revision": null, - "target_modules": [ - "up_proj", - "o_proj", - "gate_proj", - "down_proj", - "k_proj", - "q_proj", - "v_proj" - ], - "target_parameters": null, - "task_type": "CAUSAL_LM", - "trainable_token_indices": null, - "use_dora": false, - "use_qalora": false, - "use_rslora": false -} \ No newline at end of file diff --git a/adapter_model.safetensors b/adapter_model.safetensors deleted file mode 100644 index fe216c6a898cbd86be20675259ac5e461d2ca362..0000000000000000000000000000000000000000 --- a/adapter_model.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:491a381f62798faedfe204bdaf00433d1efc35b1a9ec968f59030ebe507aa61a -size 250422888 diff --git a/chat_template.jinja b/chat_template.jinja deleted file mode 100644 index 21dba1af1b9154e9140fe0ef5ca06d011b5004c8..0000000000000000000000000000000000000000 --- a/chat_template.jinja +++ /dev/null @@ -1 +0,0 @@ -{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<>\n' + system_message + '\n<>\n\n' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + eos_token }}{% endif %}{% endfor %} \ No newline at end of file diff --git a/checkpoint-100/README.md b/checkpoint-100/README.md deleted file mode 100644 index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000 --- a/checkpoint-100/README.md +++ /dev/null @@ -1,207 +0,0 @@ ---- -base_model: meta-llama/Llama-3.2-3B-Instruct -library_name: peft -pipeline_tag: text-generation -tags: -- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct -- lora -- transformers ---- - -# Model Card for Model ID - - - - - -## Model Details - -### Model Description - - - - - -- **Developed by:** [More Information Needed] -- **Funded by [optional]:** [More Information Needed] -- **Shared by [optional]:** [More Information Needed] -- **Model type:** [More Information Needed] -- **Language(s) (NLP):** [More Information Needed] -- **License:** [More Information Needed] -- **Finetuned from model [optional]:** [More Information Needed] - -### Model Sources [optional] - - - -- **Repository:** [More Information Needed] -- **Paper [optional]:** [More Information Needed] -- **Demo [optional]:** [More Information Needed] - -## Uses - - - -### Direct Use - - - -[More Information Needed] - -### Downstream Use [optional] - - - -[More Information Needed] - -### Out-of-Scope Use - - - -[More Information Needed] - -## Bias, Risks, and Limitations - - - -[More Information Needed] - -### Recommendations - - - -Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. - -## How to Get Started with the Model - -Use the code below to get started with the model. - -[More Information Needed] - -## Training Details - -### Training Data - - - -[More Information Needed] - -### Training Procedure - - - -#### Preprocessing [optional] - -[More Information Needed] - - -#### Training Hyperparameters - -- **Training regime:** [More Information Needed] - -#### Speeds, Sizes, Times [optional] - - - -[More Information Needed] - -## Evaluation - - - -### Testing Data, Factors & Metrics - -#### Testing Data - - - -[More Information Needed] - -#### Factors - - - -[More Information Needed] - -#### Metrics - - - -[More Information Needed] - -### Results - -[More Information Needed] - -#### Summary - - - -## Model Examination [optional] - - - -[More Information Needed] - -## Environmental Impact - - - -Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). - -- **Hardware Type:** [More Information Needed] -- **Hours used:** [More Information Needed] -- **Cloud Provider:** [More Information Needed] -- **Compute Region:** [More Information Needed] -- **Carbon Emitted:** [More Information Needed] - -## Technical Specifications [optional] - -### Model Architecture and Objective - -[More Information Needed] - -### Compute Infrastructure - -[More Information Needed] - -#### Hardware - -[More Information Needed] - -#### Software - -[More Information Needed] - -## Citation [optional] - - - -**BibTeX:** - -[More Information Needed] - -**APA:** - -[More Information Needed] - -## Glossary [optional] - - - -[More Information Needed] - -## More Information [optional] - -[More Information Needed] - -## Model Card Authors [optional] - -[More Information Needed] - -## Model Card Contact - -[More Information Needed] -### Framework versions - -- PEFT 0.17.1 \ No newline at end of file diff --git a/checkpoint-100/adapter_config.json b/checkpoint-100/adapter_config.json deleted file mode 100644 index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000 --- a/checkpoint-100/adapter_config.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "alpha_pattern": {}, - "auto_mapping": null, - "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct", - "bias": "none", - "corda_config": null, - "eva_config": null, - "exclude_modules": null, - "fan_in_fan_out": false, - "inference_mode": true, - "init_lora_weights": true, - "layer_replication": null, - "layers_pattern": null, - "layers_to_transform": null, - "loftq_config": {}, - "lora_alpha": 32, - "lora_bias": false, - "lora_dropout": 0.1, - "megatron_config": null, - "megatron_core": "megatron.core", - "modules_to_save": null, - "peft_type": "LORA", - "qalora_group_size": 16, - "r": 16, - "rank_pattern": {}, - "revision": null, - "target_modules": [ - "down_proj", - "v_proj", - "q_proj", - "k_proj", - "gate_proj", - "o_proj", - "up_proj" - ], - "target_parameters": null, - "task_type": "CAUSAL_LM", - "trainable_token_indices": null, - "use_dora": false, - "use_qalora": false, - "use_rslora": false -} \ No newline at end of file diff --git a/checkpoint-100/adapter_model.safetensors b/checkpoint-100/adapter_model.safetensors deleted file mode 100644 index d0b49f3e9c4924545ee8d71a6a5c9740a61f4c6d..0000000000000000000000000000000000000000 --- a/checkpoint-100/adapter_model.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4fc6b553d80d4183d5a3cc772dccc582287021fa6ccce89b08c7e64930c0bdd5 -size 97307544 diff --git a/checkpoint-100/chat_template.jinja b/checkpoint-100/chat_template.jinja deleted file mode 100644 index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000 --- a/checkpoint-100/chat_template.jinja +++ /dev/null @@ -1,93 +0,0 @@ -{{- bos_token }} -{%- if custom_tools is defined %} - {%- set tools = custom_tools %} -{%- endif %} -{%- if not tools_in_user_message is defined %} - {%- set tools_in_user_message = true %} -{%- endif %} -{%- if not date_string is defined %} - {%- if strftime_now is defined %} - {%- set date_string = strftime_now("%d %b %Y") %} - {%- else %} - {%- set date_string = "26 Jul 2024" %} - {%- endif %} -{%- endif %} -{%- if not tools is defined %} - {%- set tools = none %} -{%- endif %} - -{#- This block extracts the system message, so we can slot it into the right place. #} -{%- if messages[0]['role'] == 'system' %} - {%- set system_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} -{%- else %} - {%- set system_message = "" %} -{%- endif %} - -{#- System message #} -{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} -{%- if tools is not none %} - {{- "Environment: ipython\n" }} -{%- endif %} -{{- "Cutting Knowledge Date: December 2023\n" }} -{{- "Today Date: " + date_string + "\n\n" }} -{%- if tools is not none and not tools_in_user_message %} - {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} -{%- endif %} -{{- system_message }} -{{- "<|eot_id|>" }} - -{#- Custom tools are passed in a user message with some extra guidance #} -{%- if tools_in_user_message and not tools is none %} - {#- Extract the first user message so we can plug it in here #} - {%- if messages | length != 0 %} - {%- set first_user_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} - {%- else %} - {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} -{%- endif %} - {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} - {{- "Given the following functions, please respond with a JSON for a function call " }} - {{- "with its proper arguments that best answers the given prompt.\n\n" }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} - {{- first_user_message + "<|eot_id|>"}} -{%- endif %} - -{%- for message in messages %} - {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} - {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} - {%- elif 'tool_calls' in message %} - {%- if not message.tool_calls|length == 1 %} - {{- raise_exception("This model only supports single tool-calls at once!") }} - {%- endif %} - {%- set tool_call = message.tool_calls[0].function %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} - {{- '{"name": "' + tool_call.name + '", ' }} - {{- '"parameters": ' }} - {{- tool_call.arguments | tojson }} - {{- "}" }} - {{- "<|eot_id|>" }} - {%- elif message.role == "tool" or message.role == "ipython" %} - {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} - {%- if message.content is mapping or message.content is iterable %} - {{- message.content | tojson }} - {%- else %} - {{- message.content }} - {%- endif %} - {{- "<|eot_id|>" }} - {%- endif %} -{%- endfor %} -{%- if add_generation_prompt %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} -{%- endif %} diff --git a/checkpoint-100/optimizer.pt b/checkpoint-100/optimizer.pt deleted file mode 100644 index 499bf6f0c269ddfb669b3d7e82633252d2c09e8d..0000000000000000000000000000000000000000 --- a/checkpoint-100/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f5a9c0ecb6f33b77d737e724fe719cc53e0d4cdf30efd01aaa73b310b58bf4ef -size 194846331 diff --git a/checkpoint-100/rng_state.pth b/checkpoint-100/rng_state.pth deleted file mode 100644 index ddf6f7dc00eefb78797f6a9017b7e05509310cbf..0000000000000000000000000000000000000000 --- a/checkpoint-100/rng_state.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:21eebf5c3ba6efdb5123bbdc37ec0bacf114ce7c5f26a6499a36b2a69fa2c90b -size 14645 diff --git a/checkpoint-100/scaler.pt b/checkpoint-100/scaler.pt deleted file mode 100644 index 215c5d2069bd81cb35727ebca07a510ac59c9d94..0000000000000000000000000000000000000000 --- a/checkpoint-100/scaler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c4393a84a3109995aa1202073b039b12062e3189ed89aa0b94ef0510ba843009 -size 1383 diff --git a/checkpoint-100/scheduler.pt b/checkpoint-100/scheduler.pt deleted file mode 100644 index 02d20dbc6bab763333a8ca7033099cc160ac21c8..0000000000000000000000000000000000000000 --- a/checkpoint-100/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d244377f57e78c692ea998e9ce93a7160134e1a3af6a39359aedc2d2aa9940c5 -size 1465 diff --git a/checkpoint-100/special_tokens_map.json b/checkpoint-100/special_tokens_map.json deleted file mode 100644 index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000 --- a/checkpoint-100/special_tokens_map.json +++ /dev/null @@ -1,17 +0,0 @@ -{ - "bos_token": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "eos_token": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "pad_token": "<|eot_id|>" -} diff --git a/checkpoint-100/tokenizer.json b/checkpoint-100/tokenizer.json deleted file mode 100644 index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000 --- a/checkpoint-100/tokenizer.json +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09 -size 17210184 diff --git a/checkpoint-100/tokenizer_config.json b/checkpoint-100/tokenizer_config.json deleted file mode 100644 index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000 --- a/checkpoint-100/tokenizer_config.json +++ /dev/null @@ -1,2063 +0,0 @@ -{ - "added_tokens_decoder": { - "128000": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128001": { - "content": "<|end_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128002": { - "content": "<|reserved_special_token_0|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128003": { - "content": "<|reserved_special_token_1|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128004": { - "content": "<|finetune_right_pad_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128005": { - "content": "<|reserved_special_token_2|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128006": { - "content": "<|start_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128007": { - "content": "<|end_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128008": { - "content": "<|eom_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128009": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128010": { - "content": "<|python_tag|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128011": { - "content": "<|reserved_special_token_3|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128012": { - "content": "<|reserved_special_token_4|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128013": { - "content": "<|reserved_special_token_5|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128014": { - "content": "<|reserved_special_token_6|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128015": { - "content": "<|reserved_special_token_7|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128016": { - "content": "<|reserved_special_token_8|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128017": { - "content": "<|reserved_special_token_9|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128018": { - "content": "<|reserved_special_token_10|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128019": { - "content": "<|reserved_special_token_11|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128020": { - "content": "<|reserved_special_token_12|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128021": { - "content": "<|reserved_special_token_13|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128022": { - "content": "<|reserved_special_token_14|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128023": { - "content": "<|reserved_special_token_15|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128024": { - "content": "<|reserved_special_token_16|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128025": { - "content": "<|reserved_special_token_17|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128026": { - "content": "<|reserved_special_token_18|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128027": { - "content": "<|reserved_special_token_19|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128028": { - "content": "<|reserved_special_token_20|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128029": { - "content": "<|reserved_special_token_21|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128030": { - "content": "<|reserved_special_token_22|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128031": { - "content": "<|reserved_special_token_23|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128032": { - "content": "<|reserved_special_token_24|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128033": { - "content": "<|reserved_special_token_25|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128034": { - "content": "<|reserved_special_token_26|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128035": { - "content": "<|reserved_special_token_27|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128036": { - "content": "<|reserved_special_token_28|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128037": { - "content": "<|reserved_special_token_29|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128038": { - "content": "<|reserved_special_token_30|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128039": { - "content": "<|reserved_special_token_31|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128040": { - "content": "<|reserved_special_token_32|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128041": { - "content": "<|reserved_special_token_33|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128042": { - "content": "<|reserved_special_token_34|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128043": { - "content": "<|reserved_special_token_35|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128044": { - "content": "<|reserved_special_token_36|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128045": { - "content": "<|reserved_special_token_37|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128046": { - "content": "<|reserved_special_token_38|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128047": { - "content": "<|reserved_special_token_39|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128048": { - "content": "<|reserved_special_token_40|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128049": { - "content": "<|reserved_special_token_41|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128050": { - "content": "<|reserved_special_token_42|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128051": { - "content": "<|reserved_special_token_43|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128052": { - "content": "<|reserved_special_token_44|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128053": { - "content": "<|reserved_special_token_45|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128054": { - "content": "<|reserved_special_token_46|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128055": { - "content": "<|reserved_special_token_47|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128056": { - "content": "<|reserved_special_token_48|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128057": { - "content": "<|reserved_special_token_49|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128058": { - "content": "<|reserved_special_token_50|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128059": { - "content": "<|reserved_special_token_51|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128060": { - "content": "<|reserved_special_token_52|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128061": { - "content": "<|reserved_special_token_53|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128062": { - "content": "<|reserved_special_token_54|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128063": { - "content": "<|reserved_special_token_55|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128064": { - "content": "<|reserved_special_token_56|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128065": { - "content": "<|reserved_special_token_57|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128066": { - "content": "<|reserved_special_token_58|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128067": { - "content": "<|reserved_special_token_59|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128068": { - "content": "<|reserved_special_token_60|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128069": { - "content": "<|reserved_special_token_61|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128070": { - "content": "<|reserved_special_token_62|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128071": { - "content": "<|reserved_special_token_63|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128072": { - "content": "<|reserved_special_token_64|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128073": { - "content": "<|reserved_special_token_65|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128074": { - "content": "<|reserved_special_token_66|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128075": { - "content": "<|reserved_special_token_67|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128076": { - "content": "<|reserved_special_token_68|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128077": { - "content": "<|reserved_special_token_69|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128078": { - "content": "<|reserved_special_token_70|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128079": { - "content": "<|reserved_special_token_71|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128080": { - "content": "<|reserved_special_token_72|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128081": { - "content": "<|reserved_special_token_73|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128082": { - "content": "<|reserved_special_token_74|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128083": { - "content": "<|reserved_special_token_75|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128084": { - "content": "<|reserved_special_token_76|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128085": { - "content": "<|reserved_special_token_77|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128086": { - "content": "<|reserved_special_token_78|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128087": { - "content": "<|reserved_special_token_79|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128088": { - "content": "<|reserved_special_token_80|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128089": { - "content": "<|reserved_special_token_81|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128090": { - "content": "<|reserved_special_token_82|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128091": { - "content": "<|reserved_special_token_83|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128092": { - "content": "<|reserved_special_token_84|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128093": { - "content": "<|reserved_special_token_85|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128094": { - "content": "<|reserved_special_token_86|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128095": { - "content": "<|reserved_special_token_87|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128096": { - "content": "<|reserved_special_token_88|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128097": { - "content": "<|reserved_special_token_89|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128098": { - "content": "<|reserved_special_token_90|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128099": { - "content": "<|reserved_special_token_91|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128100": { - "content": "<|reserved_special_token_92|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128101": { - "content": "<|reserved_special_token_93|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128102": { - "content": "<|reserved_special_token_94|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128103": { - "content": "<|reserved_special_token_95|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128104": { - "content": "<|reserved_special_token_96|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128105": { - "content": "<|reserved_special_token_97|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128106": { - "content": "<|reserved_special_token_98|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128107": { - "content": "<|reserved_special_token_99|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128108": { - "content": "<|reserved_special_token_100|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128109": { - "content": "<|reserved_special_token_101|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128110": { - "content": "<|reserved_special_token_102|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128111": { - "content": "<|reserved_special_token_103|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128112": { - "content": "<|reserved_special_token_104|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128113": { - "content": "<|reserved_special_token_105|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128114": { - "content": "<|reserved_special_token_106|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128115": { - "content": "<|reserved_special_token_107|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128116": { - "content": "<|reserved_special_token_108|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128117": { - "content": "<|reserved_special_token_109|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128118": { - "content": "<|reserved_special_token_110|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128119": { - "content": "<|reserved_special_token_111|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128120": { - "content": "<|reserved_special_token_112|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128121": { - "content": "<|reserved_special_token_113|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128122": { - "content": "<|reserved_special_token_114|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128123": { - "content": "<|reserved_special_token_115|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128124": { - "content": "<|reserved_special_token_116|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128125": { - "content": "<|reserved_special_token_117|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128126": { - "content": "<|reserved_special_token_118|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128127": { - "content": "<|reserved_special_token_119|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128128": { - "content": "<|reserved_special_token_120|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128129": { - "content": "<|reserved_special_token_121|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128130": { - "content": "<|reserved_special_token_122|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128131": { - "content": "<|reserved_special_token_123|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128132": { - "content": "<|reserved_special_token_124|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128133": { - "content": "<|reserved_special_token_125|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128134": { - "content": "<|reserved_special_token_126|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128135": { - "content": "<|reserved_special_token_127|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128136": { - "content": "<|reserved_special_token_128|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128137": { - "content": "<|reserved_special_token_129|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128138": { - "content": "<|reserved_special_token_130|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128139": { - "content": "<|reserved_special_token_131|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128140": { - "content": "<|reserved_special_token_132|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128141": { - "content": "<|reserved_special_token_133|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128142": { - "content": "<|reserved_special_token_134|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128143": { - "content": "<|reserved_special_token_135|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128144": { - "content": "<|reserved_special_token_136|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128145": { - "content": "<|reserved_special_token_137|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128146": { - "content": "<|reserved_special_token_138|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128147": { - "content": "<|reserved_special_token_139|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128148": { - "content": "<|reserved_special_token_140|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128149": { - "content": "<|reserved_special_token_141|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128150": { - "content": "<|reserved_special_token_142|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128151": { - "content": "<|reserved_special_token_143|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128152": { - "content": "<|reserved_special_token_144|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128153": { - "content": "<|reserved_special_token_145|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128154": { - "content": "<|reserved_special_token_146|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128155": { - "content": "<|reserved_special_token_147|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128156": { - "content": "<|reserved_special_token_148|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128157": { - "content": "<|reserved_special_token_149|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128158": { - "content": "<|reserved_special_token_150|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128159": { - "content": "<|reserved_special_token_151|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128160": { - "content": "<|reserved_special_token_152|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128161": { - "content": "<|reserved_special_token_153|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128162": { - "content": "<|reserved_special_token_154|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128163": { - "content": "<|reserved_special_token_155|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128164": { - "content": "<|reserved_special_token_156|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128165": { - "content": "<|reserved_special_token_157|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128166": { - "content": "<|reserved_special_token_158|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128167": { - "content": "<|reserved_special_token_159|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128168": { - "content": "<|reserved_special_token_160|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128169": { - "content": "<|reserved_special_token_161|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128170": { - "content": "<|reserved_special_token_162|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128171": { - "content": "<|reserved_special_token_163|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128172": { - "content": "<|reserved_special_token_164|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128173": { - "content": "<|reserved_special_token_165|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128174": { - "content": "<|reserved_special_token_166|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128175": { - "content": "<|reserved_special_token_167|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128176": { - "content": "<|reserved_special_token_168|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128177": { - "content": "<|reserved_special_token_169|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128178": { - "content": "<|reserved_special_token_170|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128179": { - "content": "<|reserved_special_token_171|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128180": { - "content": "<|reserved_special_token_172|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128181": { - "content": "<|reserved_special_token_173|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128182": { - "content": "<|reserved_special_token_174|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128183": { - "content": "<|reserved_special_token_175|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128184": { - "content": "<|reserved_special_token_176|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128185": { - "content": "<|reserved_special_token_177|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128186": { - "content": "<|reserved_special_token_178|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128187": { - "content": "<|reserved_special_token_179|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128188": { - "content": "<|reserved_special_token_180|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128189": { - "content": "<|reserved_special_token_181|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128190": { - "content": "<|reserved_special_token_182|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128191": { - "content": "<|reserved_special_token_183|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128192": { - "content": "<|reserved_special_token_184|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128193": { - "content": "<|reserved_special_token_185|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128194": { - "content": "<|reserved_special_token_186|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128195": { - "content": "<|reserved_special_token_187|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128196": { - "content": "<|reserved_special_token_188|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128197": { - "content": "<|reserved_special_token_189|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128198": { - "content": "<|reserved_special_token_190|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128199": { - "content": "<|reserved_special_token_191|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128200": { - "content": "<|reserved_special_token_192|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128201": { - "content": "<|reserved_special_token_193|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128202": { - "content": "<|reserved_special_token_194|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128203": { - "content": "<|reserved_special_token_195|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128204": { - "content": "<|reserved_special_token_196|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128205": { - "content": "<|reserved_special_token_197|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128206": { - "content": "<|reserved_special_token_198|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128207": { - "content": "<|reserved_special_token_199|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128208": { - "content": "<|reserved_special_token_200|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128209": { - "content": "<|reserved_special_token_201|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128210": { - "content": "<|reserved_special_token_202|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128211": { - "content": "<|reserved_special_token_203|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128212": { - "content": "<|reserved_special_token_204|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128213": { - "content": "<|reserved_special_token_205|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128214": { - "content": "<|reserved_special_token_206|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128215": { - "content": "<|reserved_special_token_207|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128216": { - "content": "<|reserved_special_token_208|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128217": { - "content": "<|reserved_special_token_209|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128218": { - "content": "<|reserved_special_token_210|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128219": { - "content": "<|reserved_special_token_211|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128220": { - "content": "<|reserved_special_token_212|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128221": { - "content": "<|reserved_special_token_213|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128222": { - "content": "<|reserved_special_token_214|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128223": { - "content": "<|reserved_special_token_215|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128224": { - "content": "<|reserved_special_token_216|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128225": { - "content": "<|reserved_special_token_217|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128226": { - "content": "<|reserved_special_token_218|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128227": { - "content": "<|reserved_special_token_219|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128228": { - "content": "<|reserved_special_token_220|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128229": { - "content": "<|reserved_special_token_221|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128230": { - "content": "<|reserved_special_token_222|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128231": { - "content": "<|reserved_special_token_223|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128232": { - "content": "<|reserved_special_token_224|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128233": { - "content": "<|reserved_special_token_225|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128234": { - "content": "<|reserved_special_token_226|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128235": { - "content": "<|reserved_special_token_227|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128236": { - "content": "<|reserved_special_token_228|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128237": { - "content": "<|reserved_special_token_229|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128238": { - "content": "<|reserved_special_token_230|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128239": { - "content": "<|reserved_special_token_231|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128240": { - "content": "<|reserved_special_token_232|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128241": { - "content": "<|reserved_special_token_233|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128242": { - "content": "<|reserved_special_token_234|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128243": { - "content": "<|reserved_special_token_235|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128244": { - "content": "<|reserved_special_token_236|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128245": { - "content": "<|reserved_special_token_237|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128246": { - "content": "<|reserved_special_token_238|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128247": { - "content": "<|reserved_special_token_239|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128248": { - "content": "<|reserved_special_token_240|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128249": { - "content": "<|reserved_special_token_241|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128250": { - "content": "<|reserved_special_token_242|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128251": { - "content": "<|reserved_special_token_243|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128252": { - "content": "<|reserved_special_token_244|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128253": { - "content": "<|reserved_special_token_245|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128254": { - "content": "<|reserved_special_token_246|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128255": { - "content": "<|reserved_special_token_247|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - } - }, - "bos_token": "<|begin_of_text|>", - "clean_up_tokenization_spaces": true, - "eos_token": "<|eot_id|>", - "extra_special_tokens": {}, - "model_input_names": [ - "input_ids", - "attention_mask" - ], - "model_max_length": 131072, - "pad_token": "<|eot_id|>", - "tokenizer_class": "PreTrainedTokenizerFast" -} diff --git a/checkpoint-100/trainer_state.json b/checkpoint-100/trainer_state.json deleted file mode 100644 index b85b9bb52bc4fe431a14b79564908be103d2ae3e..0000000000000000000000000000000000000000 --- a/checkpoint-100/trainer_state.json +++ /dev/null @@ -1,120 +0,0 @@ -{ - "best_global_step": 50, - "best_metric": 0.7558398842811584, - "best_model_checkpoint": null, - "epoch": 10.0, - "eval_steps": 50, - "global_step": 100, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 1.0, - "grad_norm": 1.4660576581954956, - "learning_rate": 3.6e-05, - "loss": 1.152, - "step": 10 - }, - { - "epoch": 2.0, - "grad_norm": 0.8749533295631409, - "learning_rate": 7.6e-05, - "loss": 1.0421, - "step": 20 - }, - { - "epoch": 3.0, - "grad_norm": 3.37060284614563, - "learning_rate": 0.000116, - "loss": 0.8539, - "step": 30 - }, - { - "epoch": 4.0, - "grad_norm": 1.5355278253555298, - "learning_rate": 0.00015600000000000002, - "loss": 0.5483, - "step": 40 - }, - { - "epoch": 5.0, - "grad_norm": 2.454838514328003, - "learning_rate": 0.000196, - "loss": 0.3736, - "step": 50 - }, - { - "epoch": 5.0, - "eval_loss": 0.7558398842811584, - "eval_runtime": 1.7227, - "eval_samples_per_second": 2.902, - "eval_steps_per_second": 2.902, - "step": 50 - }, - { - "epoch": 6.0, - "grad_norm": 3.676417827606201, - "learning_rate": 0.000196, - "loss": 0.2291, - "step": 60 - }, - { - "epoch": 7.0, - "grad_norm": 2.192375898361206, - "learning_rate": 0.00019155555555555554, - "loss": 0.1244, - "step": 70 - }, - { - "epoch": 8.0, - "grad_norm": 2.630005359649658, - "learning_rate": 0.00018711111111111112, - "loss": 0.0862, - "step": 80 - }, - { - "epoch": 9.0, - "grad_norm": 0.5021786093711853, - "learning_rate": 0.00018266666666666667, - "loss": 0.0614, - "step": 90 - }, - { - "epoch": 10.0, - "grad_norm": 0.38170942664146423, - "learning_rate": 0.00017822222222222222, - "loss": 0.0471, - "step": 100 - }, - { - "epoch": 10.0, - "eval_loss": 0.8806974291801453, - "eval_runtime": 1.7764, - "eval_samples_per_second": 2.815, - "eval_steps_per_second": 2.815, - "step": 100 - } - ], - "logging_steps": 10, - "max_steps": 500, - "num_input_tokens_seen": 0, - "num_train_epochs": 50, - "save_steps": 100, - "stateful_callbacks": { - "TrainerControl": { - "args": { - "should_epoch_stop": false, - "should_evaluate": false, - "should_log": false, - "should_save": true, - "should_training_stop": false - }, - "attributes": {} - } - }, - "total_flos": 1.327550391386112e+16, - "train_batch_size": 1, - "trial_name": null, - "trial_params": null -} diff --git a/checkpoint-100/training_args.bin b/checkpoint-100/training_args.bin deleted file mode 100644 index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000 --- a/checkpoint-100/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f -size 5777 diff --git a/checkpoint-200/README.md b/checkpoint-200/README.md deleted file mode 100644 index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000 --- a/checkpoint-200/README.md +++ /dev/null @@ -1,207 +0,0 @@ ---- -base_model: meta-llama/Llama-3.2-3B-Instruct -library_name: peft -pipeline_tag: text-generation -tags: -- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct -- lora -- transformers ---- - -# Model Card for Model ID - - - - - -## Model Details - -### Model Description - - - - - -- **Developed by:** [More Information Needed] -- **Funded by [optional]:** [More Information Needed] -- **Shared by [optional]:** [More Information Needed] -- **Model type:** [More Information Needed] -- **Language(s) (NLP):** [More Information Needed] -- **License:** [More Information Needed] -- **Finetuned from model [optional]:** [More Information Needed] - -### Model Sources [optional] - - - -- **Repository:** [More Information Needed] -- **Paper [optional]:** [More Information Needed] -- **Demo [optional]:** [More Information Needed] - -## Uses - - - -### Direct Use - - - -[More Information Needed] - -### Downstream Use [optional] - - - -[More Information Needed] - -### Out-of-Scope Use - - - -[More Information Needed] - -## Bias, Risks, and Limitations - - - -[More Information Needed] - -### Recommendations - - - -Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. - -## How to Get Started with the Model - -Use the code below to get started with the model. - -[More Information Needed] - -## Training Details - -### Training Data - - - -[More Information Needed] - -### Training Procedure - - - -#### Preprocessing [optional] - -[More Information Needed] - - -#### Training Hyperparameters - -- **Training regime:** [More Information Needed] - -#### Speeds, Sizes, Times [optional] - - - -[More Information Needed] - -## Evaluation - - - -### Testing Data, Factors & Metrics - -#### Testing Data - - - -[More Information Needed] - -#### Factors - - - -[More Information Needed] - -#### Metrics - - - -[More Information Needed] - -### Results - -[More Information Needed] - -#### Summary - - - -## Model Examination [optional] - - - -[More Information Needed] - -## Environmental Impact - - - -Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). - -- **Hardware Type:** [More Information Needed] -- **Hours used:** [More Information Needed] -- **Cloud Provider:** [More Information Needed] -- **Compute Region:** [More Information Needed] -- **Carbon Emitted:** [More Information Needed] - -## Technical Specifications [optional] - -### Model Architecture and Objective - -[More Information Needed] - -### Compute Infrastructure - -[More Information Needed] - -#### Hardware - -[More Information Needed] - -#### Software - -[More Information Needed] - -## Citation [optional] - - - -**BibTeX:** - -[More Information Needed] - -**APA:** - -[More Information Needed] - -## Glossary [optional] - - - -[More Information Needed] - -## More Information [optional] - -[More Information Needed] - -## Model Card Authors [optional] - -[More Information Needed] - -## Model Card Contact - -[More Information Needed] -### Framework versions - -- PEFT 0.17.1 \ No newline at end of file diff --git a/checkpoint-200/adapter_config.json b/checkpoint-200/adapter_config.json deleted file mode 100644 index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000 --- a/checkpoint-200/adapter_config.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "alpha_pattern": {}, - "auto_mapping": null, - "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct", - "bias": "none", - "corda_config": null, - "eva_config": null, - "exclude_modules": null, - "fan_in_fan_out": false, - "inference_mode": true, - "init_lora_weights": true, - "layer_replication": null, - "layers_pattern": null, - "layers_to_transform": null, - "loftq_config": {}, - "lora_alpha": 32, - "lora_bias": false, - "lora_dropout": 0.1, - "megatron_config": null, - "megatron_core": "megatron.core", - "modules_to_save": null, - "peft_type": "LORA", - "qalora_group_size": 16, - "r": 16, - "rank_pattern": {}, - "revision": null, - "target_modules": [ - "down_proj", - "v_proj", - "q_proj", - "k_proj", - "gate_proj", - "o_proj", - "up_proj" - ], - "target_parameters": null, - "task_type": "CAUSAL_LM", - "trainable_token_indices": null, - "use_dora": false, - "use_qalora": false, - "use_rslora": false -} \ No newline at end of file diff --git a/checkpoint-200/adapter_model.safetensors b/checkpoint-200/adapter_model.safetensors deleted file mode 100644 index 2b3fa85b7a0b2b881f5ad32e10c70d80a5846133..0000000000000000000000000000000000000000 --- a/checkpoint-200/adapter_model.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:10f314568bf765a9d52faf4b26b09d687304a1e227e75be06f046a06de38812a -size 97307544 diff --git a/checkpoint-200/chat_template.jinja b/checkpoint-200/chat_template.jinja deleted file mode 100644 index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000 --- a/checkpoint-200/chat_template.jinja +++ /dev/null @@ -1,93 +0,0 @@ -{{- bos_token }} -{%- if custom_tools is defined %} - {%- set tools = custom_tools %} -{%- endif %} -{%- if not tools_in_user_message is defined %} - {%- set tools_in_user_message = true %} -{%- endif %} -{%- if not date_string is defined %} - {%- if strftime_now is defined %} - {%- set date_string = strftime_now("%d %b %Y") %} - {%- else %} - {%- set date_string = "26 Jul 2024" %} - {%- endif %} -{%- endif %} -{%- if not tools is defined %} - {%- set tools = none %} -{%- endif %} - -{#- This block extracts the system message, so we can slot it into the right place. #} -{%- if messages[0]['role'] == 'system' %} - {%- set system_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} -{%- else %} - {%- set system_message = "" %} -{%- endif %} - -{#- System message #} -{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} -{%- if tools is not none %} - {{- "Environment: ipython\n" }} -{%- endif %} -{{- "Cutting Knowledge Date: December 2023\n" }} -{{- "Today Date: " + date_string + "\n\n" }} -{%- if tools is not none and not tools_in_user_message %} - {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} -{%- endif %} -{{- system_message }} -{{- "<|eot_id|>" }} - -{#- Custom tools are passed in a user message with some extra guidance #} -{%- if tools_in_user_message and not tools is none %} - {#- Extract the first user message so we can plug it in here #} - {%- if messages | length != 0 %} - {%- set first_user_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} - {%- else %} - {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} -{%- endif %} - {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} - {{- "Given the following functions, please respond with a JSON for a function call " }} - {{- "with its proper arguments that best answers the given prompt.\n\n" }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} - {{- first_user_message + "<|eot_id|>"}} -{%- endif %} - -{%- for message in messages %} - {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} - {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} - {%- elif 'tool_calls' in message %} - {%- if not message.tool_calls|length == 1 %} - {{- raise_exception("This model only supports single tool-calls at once!") }} - {%- endif %} - {%- set tool_call = message.tool_calls[0].function %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} - {{- '{"name": "' + tool_call.name + '", ' }} - {{- '"parameters": ' }} - {{- tool_call.arguments | tojson }} - {{- "}" }} - {{- "<|eot_id|>" }} - {%- elif message.role == "tool" or message.role == "ipython" %} - {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} - {%- if message.content is mapping or message.content is iterable %} - {{- message.content | tojson }} - {%- else %} - {{- message.content }} - {%- endif %} - {{- "<|eot_id|>" }} - {%- endif %} -{%- endfor %} -{%- if add_generation_prompt %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} -{%- endif %} diff --git a/checkpoint-200/optimizer.pt b/checkpoint-200/optimizer.pt deleted file mode 100644 index f3b02add2d4ca6a44295d48814dd6b7f776e823b..0000000000000000000000000000000000000000 --- a/checkpoint-200/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b6e4054c31ada60cdc2d5abc92ee7ae6a394f2aee4f62444f6182af065065469 -size 194846331 diff --git a/checkpoint-200/rng_state.pth b/checkpoint-200/rng_state.pth deleted file mode 100644 index f90d2ea69ed0322133c0a511dcd98aef2e801910..0000000000000000000000000000000000000000 --- a/checkpoint-200/rng_state.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5d4b19975224e425acc366825a1e7970a459487fa7a57ffeb1a94ad4de25fa1d -size 14645 diff --git a/checkpoint-200/scaler.pt b/checkpoint-200/scaler.pt deleted file mode 100644 index dce3572b315210d751b935f42f897c650110e0c7..0000000000000000000000000000000000000000 --- a/checkpoint-200/scaler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:124625e167eb28acbfc793cfcb3e8a08b32e7fea06501462bc9e420a5e1beb2a -size 1383 diff --git a/checkpoint-200/scheduler.pt b/checkpoint-200/scheduler.pt deleted file mode 100644 index 6293f8e8c13cfc93b4ba1fb58087d97a20041222..0000000000000000000000000000000000000000 --- a/checkpoint-200/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:37315ef08bfa8057ff315cea8e5349272ef9591e350519ec1b303f17a237220b -size 1465 diff --git a/checkpoint-200/special_tokens_map.json b/checkpoint-200/special_tokens_map.json deleted file mode 100644 index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000 --- a/checkpoint-200/special_tokens_map.json +++ /dev/null @@ -1,17 +0,0 @@ -{ - "bos_token": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "eos_token": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "pad_token": "<|eot_id|>" -} diff --git a/checkpoint-200/tokenizer.json b/checkpoint-200/tokenizer.json deleted file mode 100644 index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000 --- a/checkpoint-200/tokenizer.json +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09 -size 17210184 diff --git a/checkpoint-200/tokenizer_config.json b/checkpoint-200/tokenizer_config.json deleted file mode 100644 index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000 --- a/checkpoint-200/tokenizer_config.json +++ /dev/null @@ -1,2063 +0,0 @@ -{ - "added_tokens_decoder": { - "128000": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128001": { - "content": "<|end_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128002": { - "content": "<|reserved_special_token_0|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128003": { - "content": "<|reserved_special_token_1|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128004": { - "content": "<|finetune_right_pad_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128005": { - "content": "<|reserved_special_token_2|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128006": { - "content": "<|start_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128007": { - "content": "<|end_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128008": { - "content": "<|eom_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128009": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128010": { - "content": "<|python_tag|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128011": { - "content": "<|reserved_special_token_3|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128012": { - "content": "<|reserved_special_token_4|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128013": { - "content": "<|reserved_special_token_5|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128014": { - "content": "<|reserved_special_token_6|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128015": { - "content": "<|reserved_special_token_7|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128016": { - "content": "<|reserved_special_token_8|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128017": { - "content": "<|reserved_special_token_9|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128018": { - "content": "<|reserved_special_token_10|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128019": { - "content": "<|reserved_special_token_11|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128020": { - "content": "<|reserved_special_token_12|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128021": { - "content": "<|reserved_special_token_13|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128022": { - "content": "<|reserved_special_token_14|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128023": { - "content": "<|reserved_special_token_15|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128024": { - "content": "<|reserved_special_token_16|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128025": { - "content": "<|reserved_special_token_17|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128026": { - "content": "<|reserved_special_token_18|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128027": { - "content": "<|reserved_special_token_19|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128028": { - "content": "<|reserved_special_token_20|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128029": { - "content": "<|reserved_special_token_21|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128030": { - "content": "<|reserved_special_token_22|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128031": { - "content": "<|reserved_special_token_23|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128032": { - "content": "<|reserved_special_token_24|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128033": { - "content": "<|reserved_special_token_25|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128034": { - "content": "<|reserved_special_token_26|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128035": { - "content": "<|reserved_special_token_27|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128036": { - "content": "<|reserved_special_token_28|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128037": { - "content": "<|reserved_special_token_29|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128038": { - "content": "<|reserved_special_token_30|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128039": { - "content": "<|reserved_special_token_31|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128040": { - "content": "<|reserved_special_token_32|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128041": { - "content": "<|reserved_special_token_33|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128042": { - "content": "<|reserved_special_token_34|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128043": { - "content": "<|reserved_special_token_35|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128044": { - "content": "<|reserved_special_token_36|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128045": { - "content": "<|reserved_special_token_37|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128046": { - "content": "<|reserved_special_token_38|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128047": { - "content": "<|reserved_special_token_39|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128048": { - "content": "<|reserved_special_token_40|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128049": { - "content": "<|reserved_special_token_41|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128050": { - "content": "<|reserved_special_token_42|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128051": { - "content": "<|reserved_special_token_43|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128052": { - "content": "<|reserved_special_token_44|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128053": { - "content": "<|reserved_special_token_45|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128054": { - "content": "<|reserved_special_token_46|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128055": { - "content": "<|reserved_special_token_47|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128056": { - "content": "<|reserved_special_token_48|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128057": { - "content": "<|reserved_special_token_49|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128058": { - "content": "<|reserved_special_token_50|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128059": { - "content": "<|reserved_special_token_51|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128060": { - "content": "<|reserved_special_token_52|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128061": { - "content": "<|reserved_special_token_53|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128062": { - "content": "<|reserved_special_token_54|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128063": { - "content": "<|reserved_special_token_55|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128064": { - "content": "<|reserved_special_token_56|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128065": { - "content": "<|reserved_special_token_57|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128066": { - "content": "<|reserved_special_token_58|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128067": { - "content": "<|reserved_special_token_59|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128068": { - "content": "<|reserved_special_token_60|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128069": { - "content": "<|reserved_special_token_61|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128070": { - "content": "<|reserved_special_token_62|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128071": { - "content": "<|reserved_special_token_63|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128072": { - "content": "<|reserved_special_token_64|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128073": { - "content": "<|reserved_special_token_65|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128074": { - "content": "<|reserved_special_token_66|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128075": { - "content": "<|reserved_special_token_67|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128076": { - "content": "<|reserved_special_token_68|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128077": { - "content": "<|reserved_special_token_69|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128078": { - "content": "<|reserved_special_token_70|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128079": { - "content": "<|reserved_special_token_71|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128080": { - "content": "<|reserved_special_token_72|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128081": { - "content": "<|reserved_special_token_73|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128082": { - "content": "<|reserved_special_token_74|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128083": { - "content": "<|reserved_special_token_75|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128084": { - "content": "<|reserved_special_token_76|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128085": { - "content": "<|reserved_special_token_77|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128086": { - "content": "<|reserved_special_token_78|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128087": { - "content": "<|reserved_special_token_79|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128088": { - "content": "<|reserved_special_token_80|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128089": { - "content": "<|reserved_special_token_81|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128090": { - "content": "<|reserved_special_token_82|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128091": { - "content": "<|reserved_special_token_83|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128092": { - "content": "<|reserved_special_token_84|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128093": { - "content": "<|reserved_special_token_85|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128094": { - "content": "<|reserved_special_token_86|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128095": { - "content": "<|reserved_special_token_87|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128096": { - "content": "<|reserved_special_token_88|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128097": { - "content": "<|reserved_special_token_89|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128098": { - "content": "<|reserved_special_token_90|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128099": { - "content": "<|reserved_special_token_91|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128100": { - "content": "<|reserved_special_token_92|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128101": { - "content": "<|reserved_special_token_93|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128102": { - "content": "<|reserved_special_token_94|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128103": { - "content": "<|reserved_special_token_95|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128104": { - "content": "<|reserved_special_token_96|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128105": { - "content": "<|reserved_special_token_97|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128106": { - "content": "<|reserved_special_token_98|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128107": { - "content": "<|reserved_special_token_99|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128108": { - "content": "<|reserved_special_token_100|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128109": { - "content": "<|reserved_special_token_101|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128110": { - "content": "<|reserved_special_token_102|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128111": { - "content": "<|reserved_special_token_103|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128112": { - "content": "<|reserved_special_token_104|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128113": { - "content": "<|reserved_special_token_105|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128114": { - "content": "<|reserved_special_token_106|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128115": { - "content": "<|reserved_special_token_107|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128116": { - "content": "<|reserved_special_token_108|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128117": { - "content": "<|reserved_special_token_109|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128118": { - "content": "<|reserved_special_token_110|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128119": { - "content": "<|reserved_special_token_111|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128120": { - "content": "<|reserved_special_token_112|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128121": { - "content": "<|reserved_special_token_113|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128122": { - "content": "<|reserved_special_token_114|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128123": { - "content": "<|reserved_special_token_115|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128124": { - "content": "<|reserved_special_token_116|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128125": { - "content": "<|reserved_special_token_117|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128126": { - "content": "<|reserved_special_token_118|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128127": { - "content": "<|reserved_special_token_119|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128128": { - "content": "<|reserved_special_token_120|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128129": { - "content": "<|reserved_special_token_121|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128130": { - "content": "<|reserved_special_token_122|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128131": { - "content": "<|reserved_special_token_123|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128132": { - "content": "<|reserved_special_token_124|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128133": { - "content": "<|reserved_special_token_125|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128134": { - "content": "<|reserved_special_token_126|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128135": { - "content": "<|reserved_special_token_127|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128136": { - "content": "<|reserved_special_token_128|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128137": { - "content": "<|reserved_special_token_129|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128138": { - "content": "<|reserved_special_token_130|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128139": { - "content": "<|reserved_special_token_131|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128140": { - "content": "<|reserved_special_token_132|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128141": { - "content": "<|reserved_special_token_133|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128142": { - "content": "<|reserved_special_token_134|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128143": { - "content": "<|reserved_special_token_135|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128144": { - "content": "<|reserved_special_token_136|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128145": { - "content": "<|reserved_special_token_137|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128146": { - "content": "<|reserved_special_token_138|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128147": { - "content": "<|reserved_special_token_139|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128148": { - "content": "<|reserved_special_token_140|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128149": { - "content": "<|reserved_special_token_141|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128150": { - "content": "<|reserved_special_token_142|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128151": { - "content": "<|reserved_special_token_143|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128152": { - "content": "<|reserved_special_token_144|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128153": { - "content": "<|reserved_special_token_145|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128154": { - "content": "<|reserved_special_token_146|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128155": { - "content": "<|reserved_special_token_147|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128156": { - "content": "<|reserved_special_token_148|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128157": { - "content": "<|reserved_special_token_149|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128158": { - "content": "<|reserved_special_token_150|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128159": { - "content": "<|reserved_special_token_151|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128160": { - "content": "<|reserved_special_token_152|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128161": { - "content": "<|reserved_special_token_153|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128162": { - "content": "<|reserved_special_token_154|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128163": { - "content": "<|reserved_special_token_155|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128164": { - "content": "<|reserved_special_token_156|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128165": { - "content": "<|reserved_special_token_157|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128166": { - "content": "<|reserved_special_token_158|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128167": { - "content": "<|reserved_special_token_159|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128168": { - "content": "<|reserved_special_token_160|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128169": { - "content": "<|reserved_special_token_161|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128170": { - "content": "<|reserved_special_token_162|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128171": { - "content": "<|reserved_special_token_163|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128172": { - "content": "<|reserved_special_token_164|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128173": { - "content": "<|reserved_special_token_165|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128174": { - "content": "<|reserved_special_token_166|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128175": { - "content": "<|reserved_special_token_167|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128176": { - "content": "<|reserved_special_token_168|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128177": { - "content": "<|reserved_special_token_169|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128178": { - "content": "<|reserved_special_token_170|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128179": { - "content": "<|reserved_special_token_171|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128180": { - "content": "<|reserved_special_token_172|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128181": { - "content": "<|reserved_special_token_173|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128182": { - "content": "<|reserved_special_token_174|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128183": { - "content": "<|reserved_special_token_175|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128184": { - "content": "<|reserved_special_token_176|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128185": { - "content": "<|reserved_special_token_177|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128186": { - "content": "<|reserved_special_token_178|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128187": { - "content": "<|reserved_special_token_179|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128188": { - "content": "<|reserved_special_token_180|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128189": { - "content": "<|reserved_special_token_181|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128190": { - "content": "<|reserved_special_token_182|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128191": { - "content": "<|reserved_special_token_183|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128192": { - "content": "<|reserved_special_token_184|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128193": { - "content": "<|reserved_special_token_185|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128194": { - "content": "<|reserved_special_token_186|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128195": { - "content": "<|reserved_special_token_187|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128196": { - "content": "<|reserved_special_token_188|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128197": { - "content": "<|reserved_special_token_189|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128198": { - "content": "<|reserved_special_token_190|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128199": { - "content": "<|reserved_special_token_191|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128200": { - "content": "<|reserved_special_token_192|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128201": { - "content": "<|reserved_special_token_193|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128202": { - "content": "<|reserved_special_token_194|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128203": { - "content": "<|reserved_special_token_195|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128204": { - "content": "<|reserved_special_token_196|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128205": { - "content": "<|reserved_special_token_197|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128206": { - "content": "<|reserved_special_token_198|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128207": { - "content": "<|reserved_special_token_199|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128208": { - "content": "<|reserved_special_token_200|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128209": { - "content": "<|reserved_special_token_201|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128210": { - "content": "<|reserved_special_token_202|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128211": { - "content": "<|reserved_special_token_203|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128212": { - "content": "<|reserved_special_token_204|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128213": { - "content": "<|reserved_special_token_205|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128214": { - "content": "<|reserved_special_token_206|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128215": { - "content": "<|reserved_special_token_207|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128216": { - "content": "<|reserved_special_token_208|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128217": { - "content": "<|reserved_special_token_209|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128218": { - "content": "<|reserved_special_token_210|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128219": { - "content": "<|reserved_special_token_211|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128220": { - "content": "<|reserved_special_token_212|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128221": { - "content": "<|reserved_special_token_213|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128222": { - "content": "<|reserved_special_token_214|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128223": { - "content": "<|reserved_special_token_215|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128224": { - "content": "<|reserved_special_token_216|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128225": { - "content": "<|reserved_special_token_217|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128226": { - "content": "<|reserved_special_token_218|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128227": { - "content": "<|reserved_special_token_219|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128228": { - "content": "<|reserved_special_token_220|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128229": { - "content": "<|reserved_special_token_221|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128230": { - "content": "<|reserved_special_token_222|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128231": { - "content": "<|reserved_special_token_223|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128232": { - "content": "<|reserved_special_token_224|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128233": { - "content": "<|reserved_special_token_225|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128234": { - "content": "<|reserved_special_token_226|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128235": { - "content": "<|reserved_special_token_227|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128236": { - "content": "<|reserved_special_token_228|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128237": { - "content": "<|reserved_special_token_229|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128238": { - "content": "<|reserved_special_token_230|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128239": { - "content": "<|reserved_special_token_231|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128240": { - "content": "<|reserved_special_token_232|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128241": { - "content": "<|reserved_special_token_233|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128242": { - "content": "<|reserved_special_token_234|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128243": { - "content": "<|reserved_special_token_235|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128244": { - "content": "<|reserved_special_token_236|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128245": { - "content": "<|reserved_special_token_237|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128246": { - "content": "<|reserved_special_token_238|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128247": { - "content": "<|reserved_special_token_239|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128248": { - "content": "<|reserved_special_token_240|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128249": { - "content": "<|reserved_special_token_241|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128250": { - "content": "<|reserved_special_token_242|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128251": { - "content": "<|reserved_special_token_243|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128252": { - "content": "<|reserved_special_token_244|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128253": { - "content": "<|reserved_special_token_245|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128254": { - "content": "<|reserved_special_token_246|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128255": { - "content": "<|reserved_special_token_247|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - } - }, - "bos_token": "<|begin_of_text|>", - "clean_up_tokenization_spaces": true, - "eos_token": "<|eot_id|>", - "extra_special_tokens": {}, - "model_input_names": [ - "input_ids", - "attention_mask" - ], - "model_max_length": 131072, - "pad_token": "<|eot_id|>", - "tokenizer_class": "PreTrainedTokenizerFast" -} diff --git a/checkpoint-200/trainer_state.json b/checkpoint-200/trainer_state.json deleted file mode 100644 index f3e9d0600dc1755fa0c2b644f7857612aedbc180..0000000000000000000000000000000000000000 --- a/checkpoint-200/trainer_state.json +++ /dev/null @@ -1,206 +0,0 @@ -{ - "best_global_step": 50, - "best_metric": 0.7558398842811584, - "best_model_checkpoint": null, - "epoch": 20.0, - "eval_steps": 50, - "global_step": 200, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 1.0, - "grad_norm": 1.4660576581954956, - "learning_rate": 3.6e-05, - "loss": 1.152, - "step": 10 - }, - { - "epoch": 2.0, - "grad_norm": 0.8749533295631409, - "learning_rate": 7.6e-05, - "loss": 1.0421, - "step": 20 - }, - { - "epoch": 3.0, - "grad_norm": 3.37060284614563, - "learning_rate": 0.000116, - "loss": 0.8539, - "step": 30 - }, - { - "epoch": 4.0, - "grad_norm": 1.5355278253555298, - "learning_rate": 0.00015600000000000002, - "loss": 0.5483, - "step": 40 - }, - { - "epoch": 5.0, - "grad_norm": 2.454838514328003, - "learning_rate": 0.000196, - "loss": 0.3736, - "step": 50 - }, - { - "epoch": 5.0, - "eval_loss": 0.7558398842811584, - "eval_runtime": 1.7227, - "eval_samples_per_second": 2.902, - "eval_steps_per_second": 2.902, - "step": 50 - }, - { - "epoch": 6.0, - "grad_norm": 3.676417827606201, - "learning_rate": 0.000196, - "loss": 0.2291, - "step": 60 - }, - { - "epoch": 7.0, - "grad_norm": 2.192375898361206, - "learning_rate": 0.00019155555555555554, - "loss": 0.1244, - "step": 70 - }, - { - "epoch": 8.0, - "grad_norm": 2.630005359649658, - "learning_rate": 0.00018711111111111112, - "loss": 0.0862, - "step": 80 - }, - { - "epoch": 9.0, - "grad_norm": 0.5021786093711853, - "learning_rate": 0.00018266666666666667, - "loss": 0.0614, - "step": 90 - }, - { - "epoch": 10.0, - "grad_norm": 0.38170942664146423, - "learning_rate": 0.00017822222222222222, - "loss": 0.0471, - "step": 100 - }, - { - "epoch": 10.0, - "eval_loss": 0.8806974291801453, - "eval_runtime": 1.7764, - "eval_samples_per_second": 2.815, - "eval_steps_per_second": 2.815, - "step": 100 - }, - { - "epoch": 11.0, - "grad_norm": 1.223647952079773, - "learning_rate": 0.0001737777777777778, - "loss": 0.0359, - "step": 110 - }, - { - "epoch": 12.0, - "grad_norm": 0.5452818870544434, - "learning_rate": 0.00016933333333333335, - "loss": 0.0289, - "step": 120 - }, - { - "epoch": 13.0, - "grad_norm": 0.19034886360168457, - "learning_rate": 0.0001648888888888889, - "loss": 0.029, - "step": 130 - }, - { - "epoch": 14.0, - "grad_norm": 0.7483140230178833, - "learning_rate": 0.00016044444444444445, - "loss": 0.0247, - "step": 140 - }, - { - "epoch": 15.0, - "grad_norm": 0.34800082445144653, - "learning_rate": 0.00015600000000000002, - "loss": 0.0193, - "step": 150 - }, - { - "epoch": 15.0, - "eval_loss": 0.9916993379592896, - "eval_runtime": 1.7667, - "eval_samples_per_second": 2.83, - "eval_steps_per_second": 2.83, - "step": 150 - }, - { - "epoch": 16.0, - "grad_norm": 0.24237586557865143, - "learning_rate": 0.00015155555555555557, - "loss": 0.0176, - "step": 160 - }, - { - "epoch": 17.0, - "grad_norm": 0.13607177138328552, - "learning_rate": 0.00014711111111111112, - "loss": 0.0131, - "step": 170 - }, - { - "epoch": 18.0, - "grad_norm": 0.3655266761779785, - "learning_rate": 0.00014266666666666667, - "loss": 0.0164, - "step": 180 - }, - { - "epoch": 19.0, - "grad_norm": 0.08258651196956635, - "learning_rate": 0.00013822222222222222, - "loss": 0.013, - "step": 190 - }, - { - "epoch": 20.0, - "grad_norm": 0.1830163151025772, - "learning_rate": 0.00013377777777777777, - "loss": 0.0126, - "step": 200 - }, - { - "epoch": 20.0, - "eval_loss": 1.0726474523544312, - "eval_runtime": 1.7657, - "eval_samples_per_second": 2.832, - "eval_steps_per_second": 2.832, - "step": 200 - } - ], - "logging_steps": 10, - "max_steps": 500, - "num_input_tokens_seen": 0, - "num_train_epochs": 50, - "save_steps": 100, - "stateful_callbacks": { - "TrainerControl": { - "args": { - "should_epoch_stop": false, - "should_evaluate": false, - "should_log": false, - "should_save": true, - "should_training_stop": false - }, - "attributes": {} - } - }, - "total_flos": 2.655100782772224e+16, - "train_batch_size": 1, - "trial_name": null, - "trial_params": null -} diff --git a/checkpoint-200/training_args.bin b/checkpoint-200/training_args.bin deleted file mode 100644 index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000 --- a/checkpoint-200/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f -size 5777 diff --git a/checkpoint-300/README.md b/checkpoint-300/README.md deleted file mode 100644 index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000 --- a/checkpoint-300/README.md +++ /dev/null @@ -1,207 +0,0 @@ ---- -base_model: meta-llama/Llama-3.2-3B-Instruct -library_name: peft -pipeline_tag: text-generation -tags: -- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct -- lora -- transformers ---- - -# Model Card for Model ID - - - - - -## Model Details - -### Model Description - - - - - -- **Developed by:** [More Information Needed] -- **Funded by [optional]:** [More Information Needed] -- **Shared by [optional]:** [More Information Needed] -- **Model type:** [More Information Needed] -- **Language(s) (NLP):** [More Information Needed] -- **License:** [More Information Needed] -- **Finetuned from model [optional]:** [More Information Needed] - -### Model Sources [optional] - - - -- **Repository:** [More Information Needed] -- **Paper [optional]:** [More Information Needed] -- **Demo [optional]:** [More Information Needed] - -## Uses - - - -### Direct Use - - - -[More Information Needed] - -### Downstream Use [optional] - - - -[More Information Needed] - -### Out-of-Scope Use - - - -[More Information Needed] - -## Bias, Risks, and Limitations - - - -[More Information Needed] - -### Recommendations - - - -Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. - -## How to Get Started with the Model - -Use the code below to get started with the model. - -[More Information Needed] - -## Training Details - -### Training Data - - - -[More Information Needed] - -### Training Procedure - - - -#### Preprocessing [optional] - -[More Information Needed] - - -#### Training Hyperparameters - -- **Training regime:** [More Information Needed] - -#### Speeds, Sizes, Times [optional] - - - -[More Information Needed] - -## Evaluation - - - -### Testing Data, Factors & Metrics - -#### Testing Data - - - -[More Information Needed] - -#### Factors - - - -[More Information Needed] - -#### Metrics - - - -[More Information Needed] - -### Results - -[More Information Needed] - -#### Summary - - - -## Model Examination [optional] - - - -[More Information Needed] - -## Environmental Impact - - - -Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). - -- **Hardware Type:** [More Information Needed] -- **Hours used:** [More Information Needed] -- **Cloud Provider:** [More Information Needed] -- **Compute Region:** [More Information Needed] -- **Carbon Emitted:** [More Information Needed] - -## Technical Specifications [optional] - -### Model Architecture and Objective - -[More Information Needed] - -### Compute Infrastructure - -[More Information Needed] - -#### Hardware - -[More Information Needed] - -#### Software - -[More Information Needed] - -## Citation [optional] - - - -**BibTeX:** - -[More Information Needed] - -**APA:** - -[More Information Needed] - -## Glossary [optional] - - - -[More Information Needed] - -## More Information [optional] - -[More Information Needed] - -## Model Card Authors [optional] - -[More Information Needed] - -## Model Card Contact - -[More Information Needed] -### Framework versions - -- PEFT 0.17.1 \ No newline at end of file diff --git a/checkpoint-300/adapter_config.json b/checkpoint-300/adapter_config.json deleted file mode 100644 index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000 --- a/checkpoint-300/adapter_config.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "alpha_pattern": {}, - "auto_mapping": null, - "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct", - "bias": "none", - "corda_config": null, - "eva_config": null, - "exclude_modules": null, - "fan_in_fan_out": false, - "inference_mode": true, - "init_lora_weights": true, - "layer_replication": null, - "layers_pattern": null, - "layers_to_transform": null, - "loftq_config": {}, - "lora_alpha": 32, - "lora_bias": false, - "lora_dropout": 0.1, - "megatron_config": null, - "megatron_core": "megatron.core", - "modules_to_save": null, - "peft_type": "LORA", - "qalora_group_size": 16, - "r": 16, - "rank_pattern": {}, - "revision": null, - "target_modules": [ - "down_proj", - "v_proj", - "q_proj", - "k_proj", - "gate_proj", - "o_proj", - "up_proj" - ], - "target_parameters": null, - "task_type": "CAUSAL_LM", - "trainable_token_indices": null, - "use_dora": false, - "use_qalora": false, - "use_rslora": false -} \ No newline at end of file diff --git a/checkpoint-300/adapter_model.safetensors b/checkpoint-300/adapter_model.safetensors deleted file mode 100644 index fa02e67ef636431f3f1bd7bb50a45abc4d431e75..0000000000000000000000000000000000000000 --- a/checkpoint-300/adapter_model.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:14af55caa175ef52c41fa5f381b7e459ab1e20ca247f29b76a1731a7dbd687a1 -size 97307544 diff --git a/checkpoint-300/chat_template.jinja b/checkpoint-300/chat_template.jinja deleted file mode 100644 index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000 --- a/checkpoint-300/chat_template.jinja +++ /dev/null @@ -1,93 +0,0 @@ -{{- bos_token }} -{%- if custom_tools is defined %} - {%- set tools = custom_tools %} -{%- endif %} -{%- if not tools_in_user_message is defined %} - {%- set tools_in_user_message = true %} -{%- endif %} -{%- if not date_string is defined %} - {%- if strftime_now is defined %} - {%- set date_string = strftime_now("%d %b %Y") %} - {%- else %} - {%- set date_string = "26 Jul 2024" %} - {%- endif %} -{%- endif %} -{%- if not tools is defined %} - {%- set tools = none %} -{%- endif %} - -{#- This block extracts the system message, so we can slot it into the right place. #} -{%- if messages[0]['role'] == 'system' %} - {%- set system_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} -{%- else %} - {%- set system_message = "" %} -{%- endif %} - -{#- System message #} -{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} -{%- if tools is not none %} - {{- "Environment: ipython\n" }} -{%- endif %} -{{- "Cutting Knowledge Date: December 2023\n" }} -{{- "Today Date: " + date_string + "\n\n" }} -{%- if tools is not none and not tools_in_user_message %} - {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} -{%- endif %} -{{- system_message }} -{{- "<|eot_id|>" }} - -{#- Custom tools are passed in a user message with some extra guidance #} -{%- if tools_in_user_message and not tools is none %} - {#- Extract the first user message so we can plug it in here #} - {%- if messages | length != 0 %} - {%- set first_user_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} - {%- else %} - {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} -{%- endif %} - {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} - {{- "Given the following functions, please respond with a JSON for a function call " }} - {{- "with its proper arguments that best answers the given prompt.\n\n" }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} - {{- first_user_message + "<|eot_id|>"}} -{%- endif %} - -{%- for message in messages %} - {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} - {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} - {%- elif 'tool_calls' in message %} - {%- if not message.tool_calls|length == 1 %} - {{- raise_exception("This model only supports single tool-calls at once!") }} - {%- endif %} - {%- set tool_call = message.tool_calls[0].function %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} - {{- '{"name": "' + tool_call.name + '", ' }} - {{- '"parameters": ' }} - {{- tool_call.arguments | tojson }} - {{- "}" }} - {{- "<|eot_id|>" }} - {%- elif message.role == "tool" or message.role == "ipython" %} - {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} - {%- if message.content is mapping or message.content is iterable %} - {{- message.content | tojson }} - {%- else %} - {{- message.content }} - {%- endif %} - {{- "<|eot_id|>" }} - {%- endif %} -{%- endfor %} -{%- if add_generation_prompt %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} -{%- endif %} diff --git a/checkpoint-300/optimizer.pt b/checkpoint-300/optimizer.pt deleted file mode 100644 index fbe8a79cd43aa475b2625c579adcaf7b916880ea..0000000000000000000000000000000000000000 --- a/checkpoint-300/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:11a8648049805bd21b4256f97311f1c7e5d02c1a70b65f964c5bf4c6bbea76db -size 194846331 diff --git a/checkpoint-300/rng_state.pth b/checkpoint-300/rng_state.pth deleted file mode 100644 index f9d54aec27333781cf245af3b0d9f6021b912fd0..0000000000000000000000000000000000000000 --- a/checkpoint-300/rng_state.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fbeebc7cba55f82e50391dff743835517526f978147ac553bab00af14778c49f -size 14645 diff --git a/checkpoint-300/scaler.pt b/checkpoint-300/scaler.pt deleted file mode 100644 index 872dde653491aa0ae40076c2acf51d2ae74df8ca..0000000000000000000000000000000000000000 --- a/checkpoint-300/scaler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:30af866df24edce708e1eb20700878b402fa05707fa9bc5f332496baf440dbbb -size 1383 diff --git a/checkpoint-300/scheduler.pt b/checkpoint-300/scheduler.pt deleted file mode 100644 index f1c1f6fce8c95692de3ea5fa744ec3bb94beda20..0000000000000000000000000000000000000000 --- a/checkpoint-300/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ad080a2632c9b5ed3878ced74ddb263235bce94c1d8e5dcafc6c1256600d3693 -size 1465 diff --git a/checkpoint-300/special_tokens_map.json b/checkpoint-300/special_tokens_map.json deleted file mode 100644 index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000 --- a/checkpoint-300/special_tokens_map.json +++ /dev/null @@ -1,17 +0,0 @@ -{ - "bos_token": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "eos_token": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "pad_token": "<|eot_id|>" -} diff --git a/checkpoint-300/tokenizer.json b/checkpoint-300/tokenizer.json deleted file mode 100644 index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000 --- a/checkpoint-300/tokenizer.json +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09 -size 17210184 diff --git a/checkpoint-300/tokenizer_config.json b/checkpoint-300/tokenizer_config.json deleted file mode 100644 index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000 --- a/checkpoint-300/tokenizer_config.json +++ /dev/null @@ -1,2063 +0,0 @@ -{ - "added_tokens_decoder": { - "128000": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128001": { - "content": "<|end_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128002": { - "content": "<|reserved_special_token_0|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128003": { - "content": "<|reserved_special_token_1|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128004": { - "content": "<|finetune_right_pad_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128005": { - "content": "<|reserved_special_token_2|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128006": { - "content": "<|start_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128007": { - "content": "<|end_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128008": { - "content": "<|eom_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128009": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128010": { - "content": "<|python_tag|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128011": { - "content": "<|reserved_special_token_3|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128012": { - "content": "<|reserved_special_token_4|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128013": { - "content": "<|reserved_special_token_5|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128014": { - "content": "<|reserved_special_token_6|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128015": { - "content": "<|reserved_special_token_7|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128016": { - "content": "<|reserved_special_token_8|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128017": { - "content": "<|reserved_special_token_9|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128018": { - "content": "<|reserved_special_token_10|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128019": { - "content": "<|reserved_special_token_11|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128020": { - "content": "<|reserved_special_token_12|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128021": { - "content": "<|reserved_special_token_13|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128022": { - "content": "<|reserved_special_token_14|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128023": { - "content": "<|reserved_special_token_15|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128024": { - "content": "<|reserved_special_token_16|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128025": { - "content": "<|reserved_special_token_17|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128026": { - "content": "<|reserved_special_token_18|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128027": { - "content": "<|reserved_special_token_19|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128028": { - "content": "<|reserved_special_token_20|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128029": { - "content": "<|reserved_special_token_21|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128030": { - "content": "<|reserved_special_token_22|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128031": { - "content": "<|reserved_special_token_23|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128032": { - "content": "<|reserved_special_token_24|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128033": { - "content": "<|reserved_special_token_25|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128034": { - "content": "<|reserved_special_token_26|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128035": { - "content": "<|reserved_special_token_27|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128036": { - "content": "<|reserved_special_token_28|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128037": { - "content": "<|reserved_special_token_29|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128038": { - "content": "<|reserved_special_token_30|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128039": { - "content": "<|reserved_special_token_31|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128040": { - "content": "<|reserved_special_token_32|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128041": { - "content": "<|reserved_special_token_33|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128042": { - "content": "<|reserved_special_token_34|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128043": { - "content": "<|reserved_special_token_35|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128044": { - "content": "<|reserved_special_token_36|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128045": { - "content": "<|reserved_special_token_37|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128046": { - "content": "<|reserved_special_token_38|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128047": { - "content": "<|reserved_special_token_39|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128048": { - "content": "<|reserved_special_token_40|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128049": { - "content": "<|reserved_special_token_41|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128050": { - "content": "<|reserved_special_token_42|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128051": { - "content": "<|reserved_special_token_43|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128052": { - "content": "<|reserved_special_token_44|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128053": { - "content": "<|reserved_special_token_45|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128054": { - "content": "<|reserved_special_token_46|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128055": { - "content": "<|reserved_special_token_47|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128056": { - "content": "<|reserved_special_token_48|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128057": { - "content": "<|reserved_special_token_49|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128058": { - "content": "<|reserved_special_token_50|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128059": { - "content": "<|reserved_special_token_51|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128060": { - "content": "<|reserved_special_token_52|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128061": { - "content": "<|reserved_special_token_53|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128062": { - "content": "<|reserved_special_token_54|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128063": { - "content": "<|reserved_special_token_55|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128064": { - "content": "<|reserved_special_token_56|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128065": { - "content": "<|reserved_special_token_57|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128066": { - "content": "<|reserved_special_token_58|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128067": { - "content": "<|reserved_special_token_59|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128068": { - "content": "<|reserved_special_token_60|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128069": { - "content": "<|reserved_special_token_61|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128070": { - "content": "<|reserved_special_token_62|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128071": { - "content": "<|reserved_special_token_63|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128072": { - "content": "<|reserved_special_token_64|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128073": { - "content": "<|reserved_special_token_65|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128074": { - "content": "<|reserved_special_token_66|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128075": { - "content": "<|reserved_special_token_67|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128076": { - "content": "<|reserved_special_token_68|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128077": { - "content": "<|reserved_special_token_69|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128078": { - "content": "<|reserved_special_token_70|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128079": { - "content": "<|reserved_special_token_71|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128080": { - "content": "<|reserved_special_token_72|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128081": { - "content": "<|reserved_special_token_73|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128082": { - "content": "<|reserved_special_token_74|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128083": { - "content": "<|reserved_special_token_75|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128084": { - "content": "<|reserved_special_token_76|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128085": { - "content": "<|reserved_special_token_77|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128086": { - "content": "<|reserved_special_token_78|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128087": { - "content": "<|reserved_special_token_79|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128088": { - "content": "<|reserved_special_token_80|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128089": { - "content": "<|reserved_special_token_81|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128090": { - "content": "<|reserved_special_token_82|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128091": { - "content": "<|reserved_special_token_83|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128092": { - "content": "<|reserved_special_token_84|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128093": { - "content": "<|reserved_special_token_85|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128094": { - "content": "<|reserved_special_token_86|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128095": { - "content": "<|reserved_special_token_87|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128096": { - "content": "<|reserved_special_token_88|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128097": { - "content": "<|reserved_special_token_89|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128098": { - "content": "<|reserved_special_token_90|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128099": { - "content": "<|reserved_special_token_91|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128100": { - "content": "<|reserved_special_token_92|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128101": { - "content": "<|reserved_special_token_93|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128102": { - "content": "<|reserved_special_token_94|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128103": { - "content": "<|reserved_special_token_95|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128104": { - "content": "<|reserved_special_token_96|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128105": { - "content": "<|reserved_special_token_97|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128106": { - "content": "<|reserved_special_token_98|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128107": { - "content": "<|reserved_special_token_99|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128108": { - "content": "<|reserved_special_token_100|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128109": { - "content": "<|reserved_special_token_101|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128110": { - "content": "<|reserved_special_token_102|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128111": { - "content": "<|reserved_special_token_103|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128112": { - "content": "<|reserved_special_token_104|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128113": { - "content": "<|reserved_special_token_105|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128114": { - "content": "<|reserved_special_token_106|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128115": { - "content": "<|reserved_special_token_107|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128116": { - "content": "<|reserved_special_token_108|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128117": { - "content": "<|reserved_special_token_109|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128118": { - "content": "<|reserved_special_token_110|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128119": { - "content": "<|reserved_special_token_111|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128120": { - "content": "<|reserved_special_token_112|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128121": { - "content": "<|reserved_special_token_113|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128122": { - "content": "<|reserved_special_token_114|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128123": { - "content": "<|reserved_special_token_115|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128124": { - "content": "<|reserved_special_token_116|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128125": { - "content": "<|reserved_special_token_117|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128126": { - "content": "<|reserved_special_token_118|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128127": { - "content": "<|reserved_special_token_119|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128128": { - "content": "<|reserved_special_token_120|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128129": { - "content": "<|reserved_special_token_121|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128130": { - "content": "<|reserved_special_token_122|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128131": { - "content": "<|reserved_special_token_123|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128132": { - "content": "<|reserved_special_token_124|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128133": { - "content": "<|reserved_special_token_125|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128134": { - "content": "<|reserved_special_token_126|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128135": { - "content": "<|reserved_special_token_127|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128136": { - "content": "<|reserved_special_token_128|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128137": { - "content": "<|reserved_special_token_129|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128138": { - "content": "<|reserved_special_token_130|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128139": { - "content": "<|reserved_special_token_131|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128140": { - "content": "<|reserved_special_token_132|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128141": { - "content": "<|reserved_special_token_133|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128142": { - "content": "<|reserved_special_token_134|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128143": { - "content": "<|reserved_special_token_135|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128144": { - "content": "<|reserved_special_token_136|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128145": { - "content": "<|reserved_special_token_137|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128146": { - "content": "<|reserved_special_token_138|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128147": { - "content": "<|reserved_special_token_139|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128148": { - "content": "<|reserved_special_token_140|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128149": { - "content": "<|reserved_special_token_141|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128150": { - "content": "<|reserved_special_token_142|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128151": { - "content": "<|reserved_special_token_143|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128152": { - "content": "<|reserved_special_token_144|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128153": { - "content": "<|reserved_special_token_145|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128154": { - "content": "<|reserved_special_token_146|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128155": { - "content": "<|reserved_special_token_147|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128156": { - "content": "<|reserved_special_token_148|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128157": { - "content": "<|reserved_special_token_149|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128158": { - "content": "<|reserved_special_token_150|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128159": { - "content": "<|reserved_special_token_151|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128160": { - "content": "<|reserved_special_token_152|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128161": { - "content": "<|reserved_special_token_153|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128162": { - "content": "<|reserved_special_token_154|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128163": { - "content": "<|reserved_special_token_155|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128164": { - "content": "<|reserved_special_token_156|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128165": { - "content": "<|reserved_special_token_157|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128166": { - "content": "<|reserved_special_token_158|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128167": { - "content": "<|reserved_special_token_159|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128168": { - "content": "<|reserved_special_token_160|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128169": { - "content": "<|reserved_special_token_161|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128170": { - "content": "<|reserved_special_token_162|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128171": { - "content": "<|reserved_special_token_163|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128172": { - "content": "<|reserved_special_token_164|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128173": { - "content": "<|reserved_special_token_165|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128174": { - "content": "<|reserved_special_token_166|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128175": { - "content": "<|reserved_special_token_167|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128176": { - "content": "<|reserved_special_token_168|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128177": { - "content": "<|reserved_special_token_169|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128178": { - "content": "<|reserved_special_token_170|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128179": { - "content": "<|reserved_special_token_171|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128180": { - "content": "<|reserved_special_token_172|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128181": { - "content": "<|reserved_special_token_173|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128182": { - "content": "<|reserved_special_token_174|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128183": { - "content": "<|reserved_special_token_175|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128184": { - "content": "<|reserved_special_token_176|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128185": { - "content": "<|reserved_special_token_177|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128186": { - "content": "<|reserved_special_token_178|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128187": { - "content": "<|reserved_special_token_179|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128188": { - "content": "<|reserved_special_token_180|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128189": { - "content": "<|reserved_special_token_181|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128190": { - "content": "<|reserved_special_token_182|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128191": { - "content": "<|reserved_special_token_183|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128192": { - "content": "<|reserved_special_token_184|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128193": { - "content": "<|reserved_special_token_185|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128194": { - "content": "<|reserved_special_token_186|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128195": { - "content": "<|reserved_special_token_187|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128196": { - "content": "<|reserved_special_token_188|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128197": { - "content": "<|reserved_special_token_189|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128198": { - "content": "<|reserved_special_token_190|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128199": { - "content": "<|reserved_special_token_191|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128200": { - "content": "<|reserved_special_token_192|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128201": { - "content": "<|reserved_special_token_193|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128202": { - "content": "<|reserved_special_token_194|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128203": { - "content": "<|reserved_special_token_195|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128204": { - "content": "<|reserved_special_token_196|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128205": { - "content": "<|reserved_special_token_197|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128206": { - "content": "<|reserved_special_token_198|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128207": { - "content": "<|reserved_special_token_199|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128208": { - "content": "<|reserved_special_token_200|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128209": { - "content": "<|reserved_special_token_201|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128210": { - "content": "<|reserved_special_token_202|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128211": { - "content": "<|reserved_special_token_203|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128212": { - "content": "<|reserved_special_token_204|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128213": { - "content": "<|reserved_special_token_205|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128214": { - "content": "<|reserved_special_token_206|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128215": { - "content": "<|reserved_special_token_207|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128216": { - "content": "<|reserved_special_token_208|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128217": { - "content": "<|reserved_special_token_209|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128218": { - "content": "<|reserved_special_token_210|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128219": { - "content": "<|reserved_special_token_211|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128220": { - "content": "<|reserved_special_token_212|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128221": { - "content": "<|reserved_special_token_213|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128222": { - "content": "<|reserved_special_token_214|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128223": { - "content": "<|reserved_special_token_215|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128224": { - "content": "<|reserved_special_token_216|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128225": { - "content": "<|reserved_special_token_217|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128226": { - "content": "<|reserved_special_token_218|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128227": { - "content": "<|reserved_special_token_219|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128228": { - "content": "<|reserved_special_token_220|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128229": { - "content": "<|reserved_special_token_221|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128230": { - "content": "<|reserved_special_token_222|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128231": { - "content": "<|reserved_special_token_223|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128232": { - "content": "<|reserved_special_token_224|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128233": { - "content": "<|reserved_special_token_225|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128234": { - "content": "<|reserved_special_token_226|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128235": { - "content": "<|reserved_special_token_227|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128236": { - "content": "<|reserved_special_token_228|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128237": { - "content": "<|reserved_special_token_229|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128238": { - "content": "<|reserved_special_token_230|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128239": { - "content": "<|reserved_special_token_231|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128240": { - "content": "<|reserved_special_token_232|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128241": { - "content": "<|reserved_special_token_233|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128242": { - "content": "<|reserved_special_token_234|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128243": { - "content": "<|reserved_special_token_235|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128244": { - "content": "<|reserved_special_token_236|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128245": { - "content": "<|reserved_special_token_237|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128246": { - "content": "<|reserved_special_token_238|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128247": { - "content": "<|reserved_special_token_239|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128248": { - "content": "<|reserved_special_token_240|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128249": { - "content": "<|reserved_special_token_241|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128250": { - "content": "<|reserved_special_token_242|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128251": { - "content": "<|reserved_special_token_243|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128252": { - "content": "<|reserved_special_token_244|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128253": { - "content": "<|reserved_special_token_245|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128254": { - "content": "<|reserved_special_token_246|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128255": { - "content": "<|reserved_special_token_247|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - } - }, - "bos_token": "<|begin_of_text|>", - "clean_up_tokenization_spaces": true, - "eos_token": "<|eot_id|>", - "extra_special_tokens": {}, - "model_input_names": [ - "input_ids", - "attention_mask" - ], - "model_max_length": 131072, - "pad_token": "<|eot_id|>", - "tokenizer_class": "PreTrainedTokenizerFast" -} diff --git a/checkpoint-300/trainer_state.json b/checkpoint-300/trainer_state.json deleted file mode 100644 index 19c01d505ad92122929d029d241bfd9151c6e278..0000000000000000000000000000000000000000 --- a/checkpoint-300/trainer_state.json +++ /dev/null @@ -1,292 +0,0 @@ -{ - "best_global_step": 50, - "best_metric": 0.7558398842811584, - "best_model_checkpoint": null, - "epoch": 30.0, - "eval_steps": 50, - "global_step": 300, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 1.0, - "grad_norm": 1.4660576581954956, - "learning_rate": 3.6e-05, - "loss": 1.152, - "step": 10 - }, - { - "epoch": 2.0, - "grad_norm": 0.8749533295631409, - "learning_rate": 7.6e-05, - "loss": 1.0421, - "step": 20 - }, - { - "epoch": 3.0, - "grad_norm": 3.37060284614563, - "learning_rate": 0.000116, - "loss": 0.8539, - "step": 30 - }, - { - "epoch": 4.0, - "grad_norm": 1.5355278253555298, - "learning_rate": 0.00015600000000000002, - "loss": 0.5483, - "step": 40 - }, - { - "epoch": 5.0, - "grad_norm": 2.454838514328003, - "learning_rate": 0.000196, - "loss": 0.3736, - "step": 50 - }, - { - "epoch": 5.0, - "eval_loss": 0.7558398842811584, - "eval_runtime": 1.7227, - "eval_samples_per_second": 2.902, - "eval_steps_per_second": 2.902, - "step": 50 - }, - { - "epoch": 6.0, - "grad_norm": 3.676417827606201, - "learning_rate": 0.000196, - "loss": 0.2291, - "step": 60 - }, - { - "epoch": 7.0, - "grad_norm": 2.192375898361206, - "learning_rate": 0.00019155555555555554, - "loss": 0.1244, - "step": 70 - }, - { - "epoch": 8.0, - "grad_norm": 2.630005359649658, - "learning_rate": 0.00018711111111111112, - "loss": 0.0862, - "step": 80 - }, - { - "epoch": 9.0, - "grad_norm": 0.5021786093711853, - "learning_rate": 0.00018266666666666667, - "loss": 0.0614, - "step": 90 - }, - { - "epoch": 10.0, - "grad_norm": 0.38170942664146423, - "learning_rate": 0.00017822222222222222, - "loss": 0.0471, - "step": 100 - }, - { - "epoch": 10.0, - "eval_loss": 0.8806974291801453, - "eval_runtime": 1.7764, - "eval_samples_per_second": 2.815, - "eval_steps_per_second": 2.815, - "step": 100 - }, - { - "epoch": 11.0, - "grad_norm": 1.223647952079773, - "learning_rate": 0.0001737777777777778, - "loss": 0.0359, - "step": 110 - }, - { - "epoch": 12.0, - "grad_norm": 0.5452818870544434, - "learning_rate": 0.00016933333333333335, - "loss": 0.0289, - "step": 120 - }, - { - "epoch": 13.0, - "grad_norm": 0.19034886360168457, - "learning_rate": 0.0001648888888888889, - "loss": 0.029, - "step": 130 - }, - { - "epoch": 14.0, - "grad_norm": 0.7483140230178833, - "learning_rate": 0.00016044444444444445, - "loss": 0.0247, - "step": 140 - }, - { - "epoch": 15.0, - "grad_norm": 0.34800082445144653, - "learning_rate": 0.00015600000000000002, - "loss": 0.0193, - "step": 150 - }, - { - "epoch": 15.0, - "eval_loss": 0.9916993379592896, - "eval_runtime": 1.7667, - "eval_samples_per_second": 2.83, - "eval_steps_per_second": 2.83, - "step": 150 - }, - { - "epoch": 16.0, - "grad_norm": 0.24237586557865143, - "learning_rate": 0.00015155555555555557, - "loss": 0.0176, - "step": 160 - }, - { - "epoch": 17.0, - "grad_norm": 0.13607177138328552, - "learning_rate": 0.00014711111111111112, - "loss": 0.0131, - "step": 170 - }, - { - "epoch": 18.0, - "grad_norm": 0.3655266761779785, - "learning_rate": 0.00014266666666666667, - "loss": 0.0164, - "step": 180 - }, - { - "epoch": 19.0, - "grad_norm": 0.08258651196956635, - "learning_rate": 0.00013822222222222222, - "loss": 0.013, - "step": 190 - }, - { - "epoch": 20.0, - "grad_norm": 0.1830163151025772, - "learning_rate": 0.00013377777777777777, - "loss": 0.0126, - "step": 200 - }, - { - "epoch": 20.0, - "eval_loss": 1.0726474523544312, - "eval_runtime": 1.7657, - "eval_samples_per_second": 2.832, - "eval_steps_per_second": 2.832, - "step": 200 - }, - { - "epoch": 21.0, - "grad_norm": 0.12009257823228836, - "learning_rate": 0.00012933333333333332, - "loss": 0.0108, - "step": 210 - }, - { - "epoch": 22.0, - "grad_norm": 0.1172371432185173, - "learning_rate": 0.0001248888888888889, - "loss": 0.0122, - "step": 220 - }, - { - "epoch": 23.0, - "grad_norm": 0.14445751905441284, - "learning_rate": 0.00012044444444444445, - "loss": 0.0121, - "step": 230 - }, - { - "epoch": 24.0, - "grad_norm": 0.18198293447494507, - "learning_rate": 0.000116, - "loss": 0.0128, - "step": 240 - }, - { - "epoch": 25.0, - "grad_norm": 0.1562514454126358, - "learning_rate": 0.00011155555555555556, - "loss": 0.0117, - "step": 250 - }, - { - "epoch": 25.0, - "eval_loss": 1.106227159500122, - "eval_runtime": 1.7564, - "eval_samples_per_second": 2.847, - "eval_steps_per_second": 2.847, - "step": 250 - }, - { - "epoch": 26.0, - "grad_norm": 0.06052432581782341, - "learning_rate": 0.00010711111111111111, - "loss": 0.0123, - "step": 260 - }, - { - "epoch": 27.0, - "grad_norm": 0.03066837601363659, - "learning_rate": 0.00010266666666666666, - "loss": 0.0106, - "step": 270 - }, - { - "epoch": 28.0, - "grad_norm": 0.034792304039001465, - "learning_rate": 9.822222222222223e-05, - "loss": 0.0124, - "step": 280 - }, - { - "epoch": 29.0, - "grad_norm": 0.028368409723043442, - "learning_rate": 9.377777777777779e-05, - "loss": 0.0107, - "step": 290 - }, - { - "epoch": 30.0, - "grad_norm": 0.03258921578526497, - "learning_rate": 8.933333333333334e-05, - "loss": 0.0109, - "step": 300 - }, - { - "epoch": 30.0, - "eval_loss": 1.1306606531143188, - "eval_runtime": 1.7675, - "eval_samples_per_second": 2.829, - "eval_steps_per_second": 2.829, - "step": 300 - } - ], - "logging_steps": 10, - "max_steps": 500, - "num_input_tokens_seen": 0, - "num_train_epochs": 50, - "save_steps": 100, - "stateful_callbacks": { - "TrainerControl": { - "args": { - "should_epoch_stop": false, - "should_evaluate": false, - "should_log": false, - "should_save": true, - "should_training_stop": false - }, - "attributes": {} - } - }, - "total_flos": 3.982651174158336e+16, - "train_batch_size": 1, - "trial_name": null, - "trial_params": null -} diff --git a/checkpoint-300/training_args.bin b/checkpoint-300/training_args.bin deleted file mode 100644 index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000 --- a/checkpoint-300/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f -size 5777 diff --git a/checkpoint-400/README.md b/checkpoint-400/README.md deleted file mode 100644 index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000 --- a/checkpoint-400/README.md +++ /dev/null @@ -1,207 +0,0 @@ ---- -base_model: meta-llama/Llama-3.2-3B-Instruct -library_name: peft -pipeline_tag: text-generation -tags: -- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct -- lora -- transformers ---- - -# Model Card for Model ID - - - - - -## Model Details - -### Model Description - - - - - -- **Developed by:** [More Information Needed] -- **Funded by [optional]:** [More Information Needed] -- **Shared by [optional]:** [More Information Needed] -- **Model type:** [More Information Needed] -- **Language(s) (NLP):** [More Information Needed] -- **License:** [More Information Needed] -- **Finetuned from model [optional]:** [More Information Needed] - -### Model Sources [optional] - - - -- **Repository:** [More Information Needed] -- **Paper [optional]:** [More Information Needed] -- **Demo [optional]:** [More Information Needed] - -## Uses - - - -### Direct Use - - - -[More Information Needed] - -### Downstream Use [optional] - - - -[More Information Needed] - -### Out-of-Scope Use - - - -[More Information Needed] - -## Bias, Risks, and Limitations - - - -[More Information Needed] - -### Recommendations - - - -Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. - -## How to Get Started with the Model - -Use the code below to get started with the model. - -[More Information Needed] - -## Training Details - -### Training Data - - - -[More Information Needed] - -### Training Procedure - - - -#### Preprocessing [optional] - -[More Information Needed] - - -#### Training Hyperparameters - -- **Training regime:** [More Information Needed] - -#### Speeds, Sizes, Times [optional] - - - -[More Information Needed] - -## Evaluation - - - -### Testing Data, Factors & Metrics - -#### Testing Data - - - -[More Information Needed] - -#### Factors - - - -[More Information Needed] - -#### Metrics - - - -[More Information Needed] - -### Results - -[More Information Needed] - -#### Summary - - - -## Model Examination [optional] - - - -[More Information Needed] - -## Environmental Impact - - - -Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). - -- **Hardware Type:** [More Information Needed] -- **Hours used:** [More Information Needed] -- **Cloud Provider:** [More Information Needed] -- **Compute Region:** [More Information Needed] -- **Carbon Emitted:** [More Information Needed] - -## Technical Specifications [optional] - -### Model Architecture and Objective - -[More Information Needed] - -### Compute Infrastructure - -[More Information Needed] - -#### Hardware - -[More Information Needed] - -#### Software - -[More Information Needed] - -## Citation [optional] - - - -**BibTeX:** - -[More Information Needed] - -**APA:** - -[More Information Needed] - -## Glossary [optional] - - - -[More Information Needed] - -## More Information [optional] - -[More Information Needed] - -## Model Card Authors [optional] - -[More Information Needed] - -## Model Card Contact - -[More Information Needed] -### Framework versions - -- PEFT 0.17.1 \ No newline at end of file diff --git a/checkpoint-400/adapter_config.json b/checkpoint-400/adapter_config.json deleted file mode 100644 index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000 --- a/checkpoint-400/adapter_config.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "alpha_pattern": {}, - "auto_mapping": null, - "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct", - "bias": "none", - "corda_config": null, - "eva_config": null, - "exclude_modules": null, - "fan_in_fan_out": false, - "inference_mode": true, - "init_lora_weights": true, - "layer_replication": null, - "layers_pattern": null, - "layers_to_transform": null, - "loftq_config": {}, - "lora_alpha": 32, - "lora_bias": false, - "lora_dropout": 0.1, - "megatron_config": null, - "megatron_core": "megatron.core", - "modules_to_save": null, - "peft_type": "LORA", - "qalora_group_size": 16, - "r": 16, - "rank_pattern": {}, - "revision": null, - "target_modules": [ - "down_proj", - "v_proj", - "q_proj", - "k_proj", - "gate_proj", - "o_proj", - "up_proj" - ], - "target_parameters": null, - "task_type": "CAUSAL_LM", - "trainable_token_indices": null, - "use_dora": false, - "use_qalora": false, - "use_rslora": false -} \ No newline at end of file diff --git a/checkpoint-400/adapter_model.safetensors b/checkpoint-400/adapter_model.safetensors deleted file mode 100644 index 2bdf98938412f41cdad1d039985e9ca6e4ae8cfc..0000000000000000000000000000000000000000 --- a/checkpoint-400/adapter_model.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b09ec477371bdfadd7438ffd8a17ffa23db183558c378efb88851aa2f0878c67 -size 97307544 diff --git a/checkpoint-400/chat_template.jinja b/checkpoint-400/chat_template.jinja deleted file mode 100644 index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000 --- a/checkpoint-400/chat_template.jinja +++ /dev/null @@ -1,93 +0,0 @@ -{{- bos_token }} -{%- if custom_tools is defined %} - {%- set tools = custom_tools %} -{%- endif %} -{%- if not tools_in_user_message is defined %} - {%- set tools_in_user_message = true %} -{%- endif %} -{%- if not date_string is defined %} - {%- if strftime_now is defined %} - {%- set date_string = strftime_now("%d %b %Y") %} - {%- else %} - {%- set date_string = "26 Jul 2024" %} - {%- endif %} -{%- endif %} -{%- if not tools is defined %} - {%- set tools = none %} -{%- endif %} - -{#- This block extracts the system message, so we can slot it into the right place. #} -{%- if messages[0]['role'] == 'system' %} - {%- set system_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} -{%- else %} - {%- set system_message = "" %} -{%- endif %} - -{#- System message #} -{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} -{%- if tools is not none %} - {{- "Environment: ipython\n" }} -{%- endif %} -{{- "Cutting Knowledge Date: December 2023\n" }} -{{- "Today Date: " + date_string + "\n\n" }} -{%- if tools is not none and not tools_in_user_message %} - {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} -{%- endif %} -{{- system_message }} -{{- "<|eot_id|>" }} - -{#- Custom tools are passed in a user message with some extra guidance #} -{%- if tools_in_user_message and not tools is none %} - {#- Extract the first user message so we can plug it in here #} - {%- if messages | length != 0 %} - {%- set first_user_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} - {%- else %} - {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} -{%- endif %} - {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} - {{- "Given the following functions, please respond with a JSON for a function call " }} - {{- "with its proper arguments that best answers the given prompt.\n\n" }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} - {{- first_user_message + "<|eot_id|>"}} -{%- endif %} - -{%- for message in messages %} - {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} - {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} - {%- elif 'tool_calls' in message %} - {%- if not message.tool_calls|length == 1 %} - {{- raise_exception("This model only supports single tool-calls at once!") }} - {%- endif %} - {%- set tool_call = message.tool_calls[0].function %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} - {{- '{"name": "' + tool_call.name + '", ' }} - {{- '"parameters": ' }} - {{- tool_call.arguments | tojson }} - {{- "}" }} - {{- "<|eot_id|>" }} - {%- elif message.role == "tool" or message.role == "ipython" %} - {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} - {%- if message.content is mapping or message.content is iterable %} - {{- message.content | tojson }} - {%- else %} - {{- message.content }} - {%- endif %} - {{- "<|eot_id|>" }} - {%- endif %} -{%- endfor %} -{%- if add_generation_prompt %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} -{%- endif %} diff --git a/checkpoint-400/optimizer.pt b/checkpoint-400/optimizer.pt deleted file mode 100644 index 4ba2f96b88a00a983fe9e9439f4f034f5cc2a620..0000000000000000000000000000000000000000 --- a/checkpoint-400/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1749edc7d7adb361c013e5d65cd9069566799ebea20c3ae8bb3e5eb9ea6d2514 -size 194846331 diff --git a/checkpoint-400/rng_state.pth b/checkpoint-400/rng_state.pth deleted file mode 100644 index 2606109424f937f1bc52c93bea33a5d97a80968f..0000000000000000000000000000000000000000 --- a/checkpoint-400/rng_state.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1d4b1ffec63a9c901fcbc38e47d8abd2121fc84af05caaa0e7adce9ba19650e1 -size 14645 diff --git a/checkpoint-400/scaler.pt b/checkpoint-400/scaler.pt deleted file mode 100644 index 0b0bfee2584fa7aba2e3ab882380cdc54add60e0..0000000000000000000000000000000000000000 --- a/checkpoint-400/scaler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:30858f23bcb22d0baef45bd4add9d6fa474141308c12653c706077b87d932e49 -size 1383 diff --git a/checkpoint-400/scheduler.pt b/checkpoint-400/scheduler.pt deleted file mode 100644 index b4e8cfd932581e913336ce2133d36088daa2c2a5..0000000000000000000000000000000000000000 --- a/checkpoint-400/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aa8793d08d90abcd0fe6bf5d2eb9e6c925d0781705a129dc03f5ec30bc5e94ba -size 1465 diff --git a/checkpoint-400/special_tokens_map.json b/checkpoint-400/special_tokens_map.json deleted file mode 100644 index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000 --- a/checkpoint-400/special_tokens_map.json +++ /dev/null @@ -1,17 +0,0 @@ -{ - "bos_token": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "eos_token": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "pad_token": "<|eot_id|>" -} diff --git a/checkpoint-400/tokenizer.json b/checkpoint-400/tokenizer.json deleted file mode 100644 index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000 --- a/checkpoint-400/tokenizer.json +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09 -size 17210184 diff --git a/checkpoint-400/tokenizer_config.json b/checkpoint-400/tokenizer_config.json deleted file mode 100644 index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000 --- a/checkpoint-400/tokenizer_config.json +++ /dev/null @@ -1,2063 +0,0 @@ -{ - "added_tokens_decoder": { - "128000": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128001": { - "content": "<|end_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128002": { - "content": "<|reserved_special_token_0|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128003": { - "content": "<|reserved_special_token_1|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128004": { - "content": "<|finetune_right_pad_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128005": { - "content": "<|reserved_special_token_2|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128006": { - "content": "<|start_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128007": { - "content": "<|end_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128008": { - "content": "<|eom_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128009": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128010": { - "content": "<|python_tag|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128011": { - "content": "<|reserved_special_token_3|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128012": { - "content": "<|reserved_special_token_4|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128013": { - "content": "<|reserved_special_token_5|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128014": { - "content": "<|reserved_special_token_6|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128015": { - "content": "<|reserved_special_token_7|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128016": { - "content": "<|reserved_special_token_8|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128017": { - "content": "<|reserved_special_token_9|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128018": { - "content": "<|reserved_special_token_10|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128019": { - "content": "<|reserved_special_token_11|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128020": { - "content": "<|reserved_special_token_12|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128021": { - "content": "<|reserved_special_token_13|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128022": { - "content": "<|reserved_special_token_14|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128023": { - "content": "<|reserved_special_token_15|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128024": { - "content": "<|reserved_special_token_16|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128025": { - "content": "<|reserved_special_token_17|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128026": { - "content": "<|reserved_special_token_18|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128027": { - "content": "<|reserved_special_token_19|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128028": { - "content": "<|reserved_special_token_20|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128029": { - "content": "<|reserved_special_token_21|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128030": { - "content": "<|reserved_special_token_22|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128031": { - "content": "<|reserved_special_token_23|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128032": { - "content": "<|reserved_special_token_24|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128033": { - "content": "<|reserved_special_token_25|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128034": { - "content": "<|reserved_special_token_26|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128035": { - "content": "<|reserved_special_token_27|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128036": { - "content": "<|reserved_special_token_28|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128037": { - "content": "<|reserved_special_token_29|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128038": { - "content": "<|reserved_special_token_30|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128039": { - "content": "<|reserved_special_token_31|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128040": { - "content": "<|reserved_special_token_32|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128041": { - "content": "<|reserved_special_token_33|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128042": { - "content": "<|reserved_special_token_34|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128043": { - "content": "<|reserved_special_token_35|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128044": { - "content": "<|reserved_special_token_36|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128045": { - "content": "<|reserved_special_token_37|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128046": { - "content": "<|reserved_special_token_38|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128047": { - "content": "<|reserved_special_token_39|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128048": { - "content": "<|reserved_special_token_40|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128049": { - "content": "<|reserved_special_token_41|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128050": { - "content": "<|reserved_special_token_42|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128051": { - "content": "<|reserved_special_token_43|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128052": { - "content": "<|reserved_special_token_44|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128053": { - "content": "<|reserved_special_token_45|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128054": { - "content": "<|reserved_special_token_46|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128055": { - "content": "<|reserved_special_token_47|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128056": { - "content": "<|reserved_special_token_48|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128057": { - "content": "<|reserved_special_token_49|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128058": { - "content": "<|reserved_special_token_50|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128059": { - "content": "<|reserved_special_token_51|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128060": { - "content": "<|reserved_special_token_52|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128061": { - "content": "<|reserved_special_token_53|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128062": { - "content": "<|reserved_special_token_54|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128063": { - "content": "<|reserved_special_token_55|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128064": { - "content": "<|reserved_special_token_56|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128065": { - "content": "<|reserved_special_token_57|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128066": { - "content": "<|reserved_special_token_58|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128067": { - "content": "<|reserved_special_token_59|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128068": { - "content": "<|reserved_special_token_60|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128069": { - "content": "<|reserved_special_token_61|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128070": { - "content": "<|reserved_special_token_62|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128071": { - "content": "<|reserved_special_token_63|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128072": { - "content": "<|reserved_special_token_64|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128073": { - "content": "<|reserved_special_token_65|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128074": { - "content": "<|reserved_special_token_66|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128075": { - "content": "<|reserved_special_token_67|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128076": { - "content": "<|reserved_special_token_68|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128077": { - "content": "<|reserved_special_token_69|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128078": { - "content": "<|reserved_special_token_70|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128079": { - "content": "<|reserved_special_token_71|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128080": { - "content": "<|reserved_special_token_72|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128081": { - "content": "<|reserved_special_token_73|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128082": { - "content": "<|reserved_special_token_74|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128083": { - "content": "<|reserved_special_token_75|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128084": { - "content": "<|reserved_special_token_76|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128085": { - "content": "<|reserved_special_token_77|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128086": { - "content": "<|reserved_special_token_78|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128087": { - "content": "<|reserved_special_token_79|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128088": { - "content": "<|reserved_special_token_80|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128089": { - "content": "<|reserved_special_token_81|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128090": { - "content": "<|reserved_special_token_82|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128091": { - "content": "<|reserved_special_token_83|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128092": { - "content": "<|reserved_special_token_84|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128093": { - "content": "<|reserved_special_token_85|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128094": { - "content": "<|reserved_special_token_86|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128095": { - "content": "<|reserved_special_token_87|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128096": { - "content": "<|reserved_special_token_88|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128097": { - "content": "<|reserved_special_token_89|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128098": { - "content": "<|reserved_special_token_90|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128099": { - "content": "<|reserved_special_token_91|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128100": { - "content": "<|reserved_special_token_92|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128101": { - "content": "<|reserved_special_token_93|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128102": { - "content": "<|reserved_special_token_94|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128103": { - "content": "<|reserved_special_token_95|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128104": { - "content": "<|reserved_special_token_96|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128105": { - "content": "<|reserved_special_token_97|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128106": { - "content": "<|reserved_special_token_98|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128107": { - "content": "<|reserved_special_token_99|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128108": { - "content": "<|reserved_special_token_100|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128109": { - "content": "<|reserved_special_token_101|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128110": { - "content": "<|reserved_special_token_102|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128111": { - "content": "<|reserved_special_token_103|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128112": { - "content": "<|reserved_special_token_104|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128113": { - "content": "<|reserved_special_token_105|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128114": { - "content": "<|reserved_special_token_106|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128115": { - "content": "<|reserved_special_token_107|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128116": { - "content": "<|reserved_special_token_108|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128117": { - "content": "<|reserved_special_token_109|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128118": { - "content": "<|reserved_special_token_110|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128119": { - "content": "<|reserved_special_token_111|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128120": { - "content": "<|reserved_special_token_112|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128121": { - "content": "<|reserved_special_token_113|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128122": { - "content": "<|reserved_special_token_114|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128123": { - "content": "<|reserved_special_token_115|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128124": { - "content": "<|reserved_special_token_116|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128125": { - "content": "<|reserved_special_token_117|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128126": { - "content": "<|reserved_special_token_118|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128127": { - "content": "<|reserved_special_token_119|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128128": { - "content": "<|reserved_special_token_120|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128129": { - "content": "<|reserved_special_token_121|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128130": { - "content": "<|reserved_special_token_122|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128131": { - "content": "<|reserved_special_token_123|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128132": { - "content": "<|reserved_special_token_124|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128133": { - "content": "<|reserved_special_token_125|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128134": { - "content": "<|reserved_special_token_126|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128135": { - "content": "<|reserved_special_token_127|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128136": { - "content": "<|reserved_special_token_128|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128137": { - "content": "<|reserved_special_token_129|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128138": { - "content": "<|reserved_special_token_130|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128139": { - "content": "<|reserved_special_token_131|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128140": { - "content": "<|reserved_special_token_132|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128141": { - "content": "<|reserved_special_token_133|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128142": { - "content": "<|reserved_special_token_134|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128143": { - "content": "<|reserved_special_token_135|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128144": { - "content": "<|reserved_special_token_136|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128145": { - "content": "<|reserved_special_token_137|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128146": { - "content": "<|reserved_special_token_138|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128147": { - "content": "<|reserved_special_token_139|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128148": { - "content": "<|reserved_special_token_140|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128149": { - "content": "<|reserved_special_token_141|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128150": { - "content": "<|reserved_special_token_142|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128151": { - "content": "<|reserved_special_token_143|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128152": { - "content": "<|reserved_special_token_144|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128153": { - "content": "<|reserved_special_token_145|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128154": { - "content": "<|reserved_special_token_146|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128155": { - "content": "<|reserved_special_token_147|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128156": { - "content": "<|reserved_special_token_148|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128157": { - "content": "<|reserved_special_token_149|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128158": { - "content": "<|reserved_special_token_150|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128159": { - "content": "<|reserved_special_token_151|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128160": { - "content": "<|reserved_special_token_152|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128161": { - "content": "<|reserved_special_token_153|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128162": { - "content": "<|reserved_special_token_154|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128163": { - "content": "<|reserved_special_token_155|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128164": { - "content": "<|reserved_special_token_156|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128165": { - "content": "<|reserved_special_token_157|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128166": { - "content": "<|reserved_special_token_158|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128167": { - "content": "<|reserved_special_token_159|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128168": { - "content": "<|reserved_special_token_160|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128169": { - "content": "<|reserved_special_token_161|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128170": { - "content": "<|reserved_special_token_162|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128171": { - "content": "<|reserved_special_token_163|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128172": { - "content": "<|reserved_special_token_164|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128173": { - "content": "<|reserved_special_token_165|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128174": { - "content": "<|reserved_special_token_166|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128175": { - "content": "<|reserved_special_token_167|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128176": { - "content": "<|reserved_special_token_168|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128177": { - "content": "<|reserved_special_token_169|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128178": { - "content": "<|reserved_special_token_170|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128179": { - "content": "<|reserved_special_token_171|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128180": { - "content": "<|reserved_special_token_172|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128181": { - "content": "<|reserved_special_token_173|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128182": { - "content": "<|reserved_special_token_174|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128183": { - "content": "<|reserved_special_token_175|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128184": { - "content": "<|reserved_special_token_176|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128185": { - "content": "<|reserved_special_token_177|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128186": { - "content": "<|reserved_special_token_178|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128187": { - "content": "<|reserved_special_token_179|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128188": { - "content": "<|reserved_special_token_180|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128189": { - "content": "<|reserved_special_token_181|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128190": { - "content": "<|reserved_special_token_182|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128191": { - "content": "<|reserved_special_token_183|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128192": { - "content": "<|reserved_special_token_184|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128193": { - "content": "<|reserved_special_token_185|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128194": { - "content": "<|reserved_special_token_186|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128195": { - "content": "<|reserved_special_token_187|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128196": { - "content": "<|reserved_special_token_188|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128197": { - "content": "<|reserved_special_token_189|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128198": { - "content": "<|reserved_special_token_190|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128199": { - "content": "<|reserved_special_token_191|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128200": { - "content": "<|reserved_special_token_192|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128201": { - "content": "<|reserved_special_token_193|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128202": { - "content": "<|reserved_special_token_194|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128203": { - "content": "<|reserved_special_token_195|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128204": { - "content": "<|reserved_special_token_196|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128205": { - "content": "<|reserved_special_token_197|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128206": { - "content": "<|reserved_special_token_198|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128207": { - "content": "<|reserved_special_token_199|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128208": { - "content": "<|reserved_special_token_200|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128209": { - "content": "<|reserved_special_token_201|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128210": { - "content": "<|reserved_special_token_202|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128211": { - "content": "<|reserved_special_token_203|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128212": { - "content": "<|reserved_special_token_204|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128213": { - "content": "<|reserved_special_token_205|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128214": { - "content": "<|reserved_special_token_206|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128215": { - "content": "<|reserved_special_token_207|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128216": { - "content": "<|reserved_special_token_208|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128217": { - "content": "<|reserved_special_token_209|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128218": { - "content": "<|reserved_special_token_210|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128219": { - "content": "<|reserved_special_token_211|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128220": { - "content": "<|reserved_special_token_212|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128221": { - "content": "<|reserved_special_token_213|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128222": { - "content": "<|reserved_special_token_214|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128223": { - "content": "<|reserved_special_token_215|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128224": { - "content": "<|reserved_special_token_216|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128225": { - "content": "<|reserved_special_token_217|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128226": { - "content": "<|reserved_special_token_218|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128227": { - "content": "<|reserved_special_token_219|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128228": { - "content": "<|reserved_special_token_220|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128229": { - "content": "<|reserved_special_token_221|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128230": { - "content": "<|reserved_special_token_222|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128231": { - "content": "<|reserved_special_token_223|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128232": { - "content": "<|reserved_special_token_224|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128233": { - "content": "<|reserved_special_token_225|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128234": { - "content": "<|reserved_special_token_226|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128235": { - "content": "<|reserved_special_token_227|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128236": { - "content": "<|reserved_special_token_228|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128237": { - "content": "<|reserved_special_token_229|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128238": { - "content": "<|reserved_special_token_230|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128239": { - "content": "<|reserved_special_token_231|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128240": { - "content": "<|reserved_special_token_232|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128241": { - "content": "<|reserved_special_token_233|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128242": { - "content": "<|reserved_special_token_234|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128243": { - "content": "<|reserved_special_token_235|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128244": { - "content": "<|reserved_special_token_236|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128245": { - "content": "<|reserved_special_token_237|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128246": { - "content": "<|reserved_special_token_238|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128247": { - "content": "<|reserved_special_token_239|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128248": { - "content": "<|reserved_special_token_240|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128249": { - "content": "<|reserved_special_token_241|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128250": { - "content": "<|reserved_special_token_242|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128251": { - "content": "<|reserved_special_token_243|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128252": { - "content": "<|reserved_special_token_244|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128253": { - "content": "<|reserved_special_token_245|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128254": { - "content": "<|reserved_special_token_246|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128255": { - "content": "<|reserved_special_token_247|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - } - }, - "bos_token": "<|begin_of_text|>", - "clean_up_tokenization_spaces": true, - "eos_token": "<|eot_id|>", - "extra_special_tokens": {}, - "model_input_names": [ - "input_ids", - "attention_mask" - ], - "model_max_length": 131072, - "pad_token": "<|eot_id|>", - "tokenizer_class": "PreTrainedTokenizerFast" -} diff --git a/checkpoint-400/trainer_state.json b/checkpoint-400/trainer_state.json deleted file mode 100644 index 8536662e55d0228157dd159213a8d1ed7bf29eea..0000000000000000000000000000000000000000 --- a/checkpoint-400/trainer_state.json +++ /dev/null @@ -1,378 +0,0 @@ -{ - "best_global_step": 50, - "best_metric": 0.7558398842811584, - "best_model_checkpoint": null, - "epoch": 40.0, - "eval_steps": 50, - "global_step": 400, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 1.0, - "grad_norm": 1.4660576581954956, - "learning_rate": 3.6e-05, - "loss": 1.152, - "step": 10 - }, - { - "epoch": 2.0, - "grad_norm": 0.8749533295631409, - "learning_rate": 7.6e-05, - "loss": 1.0421, - "step": 20 - }, - { - "epoch": 3.0, - "grad_norm": 3.37060284614563, - "learning_rate": 0.000116, - "loss": 0.8539, - "step": 30 - }, - { - "epoch": 4.0, - "grad_norm": 1.5355278253555298, - "learning_rate": 0.00015600000000000002, - "loss": 0.5483, - "step": 40 - }, - { - "epoch": 5.0, - "grad_norm": 2.454838514328003, - "learning_rate": 0.000196, - "loss": 0.3736, - "step": 50 - }, - { - "epoch": 5.0, - "eval_loss": 0.7558398842811584, - "eval_runtime": 1.7227, - "eval_samples_per_second": 2.902, - "eval_steps_per_second": 2.902, - "step": 50 - }, - { - "epoch": 6.0, - "grad_norm": 3.676417827606201, - "learning_rate": 0.000196, - "loss": 0.2291, - "step": 60 - }, - { - "epoch": 7.0, - "grad_norm": 2.192375898361206, - "learning_rate": 0.00019155555555555554, - "loss": 0.1244, - "step": 70 - }, - { - "epoch": 8.0, - "grad_norm": 2.630005359649658, - "learning_rate": 0.00018711111111111112, - "loss": 0.0862, - "step": 80 - }, - { - "epoch": 9.0, - "grad_norm": 0.5021786093711853, - "learning_rate": 0.00018266666666666667, - "loss": 0.0614, - "step": 90 - }, - { - "epoch": 10.0, - "grad_norm": 0.38170942664146423, - "learning_rate": 0.00017822222222222222, - "loss": 0.0471, - "step": 100 - }, - { - "epoch": 10.0, - "eval_loss": 0.8806974291801453, - "eval_runtime": 1.7764, - "eval_samples_per_second": 2.815, - "eval_steps_per_second": 2.815, - "step": 100 - }, - { - "epoch": 11.0, - "grad_norm": 1.223647952079773, - "learning_rate": 0.0001737777777777778, - "loss": 0.0359, - "step": 110 - }, - { - "epoch": 12.0, - "grad_norm": 0.5452818870544434, - "learning_rate": 0.00016933333333333335, - "loss": 0.0289, - "step": 120 - }, - { - "epoch": 13.0, - "grad_norm": 0.19034886360168457, - "learning_rate": 0.0001648888888888889, - "loss": 0.029, - "step": 130 - }, - { - "epoch": 14.0, - "grad_norm": 0.7483140230178833, - "learning_rate": 0.00016044444444444445, - "loss": 0.0247, - "step": 140 - }, - { - "epoch": 15.0, - "grad_norm": 0.34800082445144653, - "learning_rate": 0.00015600000000000002, - "loss": 0.0193, - "step": 150 - }, - { - "epoch": 15.0, - "eval_loss": 0.9916993379592896, - "eval_runtime": 1.7667, - "eval_samples_per_second": 2.83, - "eval_steps_per_second": 2.83, - "step": 150 - }, - { - "epoch": 16.0, - "grad_norm": 0.24237586557865143, - "learning_rate": 0.00015155555555555557, - "loss": 0.0176, - "step": 160 - }, - { - "epoch": 17.0, - "grad_norm": 0.13607177138328552, - "learning_rate": 0.00014711111111111112, - "loss": 0.0131, - "step": 170 - }, - { - "epoch": 18.0, - "grad_norm": 0.3655266761779785, - "learning_rate": 0.00014266666666666667, - "loss": 0.0164, - "step": 180 - }, - { - "epoch": 19.0, - "grad_norm": 0.08258651196956635, - "learning_rate": 0.00013822222222222222, - "loss": 0.013, - "step": 190 - }, - { - "epoch": 20.0, - "grad_norm": 0.1830163151025772, - "learning_rate": 0.00013377777777777777, - "loss": 0.0126, - "step": 200 - }, - { - "epoch": 20.0, - "eval_loss": 1.0726474523544312, - "eval_runtime": 1.7657, - "eval_samples_per_second": 2.832, - "eval_steps_per_second": 2.832, - "step": 200 - }, - { - "epoch": 21.0, - "grad_norm": 0.12009257823228836, - "learning_rate": 0.00012933333333333332, - "loss": 0.0108, - "step": 210 - }, - { - "epoch": 22.0, - "grad_norm": 0.1172371432185173, - "learning_rate": 0.0001248888888888889, - "loss": 0.0122, - "step": 220 - }, - { - "epoch": 23.0, - "grad_norm": 0.14445751905441284, - "learning_rate": 0.00012044444444444445, - "loss": 0.0121, - "step": 230 - }, - { - "epoch": 24.0, - "grad_norm": 0.18198293447494507, - "learning_rate": 0.000116, - "loss": 0.0128, - "step": 240 - }, - { - "epoch": 25.0, - "grad_norm": 0.1562514454126358, - "learning_rate": 0.00011155555555555556, - "loss": 0.0117, - "step": 250 - }, - { - "epoch": 25.0, - "eval_loss": 1.106227159500122, - "eval_runtime": 1.7564, - "eval_samples_per_second": 2.847, - "eval_steps_per_second": 2.847, - "step": 250 - }, - { - "epoch": 26.0, - "grad_norm": 0.06052432581782341, - "learning_rate": 0.00010711111111111111, - "loss": 0.0123, - "step": 260 - }, - { - "epoch": 27.0, - "grad_norm": 0.03066837601363659, - "learning_rate": 0.00010266666666666666, - "loss": 0.0106, - "step": 270 - }, - { - "epoch": 28.0, - "grad_norm": 0.034792304039001465, - "learning_rate": 9.822222222222223e-05, - "loss": 0.0124, - "step": 280 - }, - { - "epoch": 29.0, - "grad_norm": 0.028368409723043442, - "learning_rate": 9.377777777777779e-05, - "loss": 0.0107, - "step": 290 - }, - { - "epoch": 30.0, - "grad_norm": 0.03258921578526497, - "learning_rate": 8.933333333333334e-05, - "loss": 0.0109, - "step": 300 - }, - { - "epoch": 30.0, - "eval_loss": 1.1306606531143188, - "eval_runtime": 1.7675, - "eval_samples_per_second": 2.829, - "eval_steps_per_second": 2.829, - "step": 300 - }, - { - "epoch": 31.0, - "grad_norm": 0.26905232667922974, - "learning_rate": 8.488888888888889e-05, - "loss": 0.0131, - "step": 310 - }, - { - "epoch": 32.0, - "grad_norm": 0.15363195538520813, - "learning_rate": 8.044444444444444e-05, - "loss": 0.0121, - "step": 320 - }, - { - "epoch": 33.0, - "grad_norm": 0.030869223177433014, - "learning_rate": 7.6e-05, - "loss": 0.0104, - "step": 330 - }, - { - "epoch": 34.0, - "grad_norm": 0.07273676246404648, - "learning_rate": 7.155555555555555e-05, - "loss": 0.0112, - "step": 340 - }, - { - "epoch": 35.0, - "grad_norm": 0.025629112496972084, - "learning_rate": 6.711111111111112e-05, - "loss": 0.0121, - "step": 350 - }, - { - "epoch": 35.0, - "eval_loss": 1.128761887550354, - "eval_runtime": 1.7518, - "eval_samples_per_second": 2.854, - "eval_steps_per_second": 2.854, - "step": 350 - }, - { - "epoch": 36.0, - "grad_norm": 0.06929411739110947, - "learning_rate": 6.266666666666667e-05, - "loss": 0.0099, - "step": 360 - }, - { - "epoch": 37.0, - "grad_norm": 0.102758027613163, - "learning_rate": 5.8222222222222224e-05, - "loss": 0.0096, - "step": 370 - }, - { - "epoch": 38.0, - "grad_norm": 0.19261795282363892, - "learning_rate": 5.377777777777778e-05, - "loss": 0.0112, - "step": 380 - }, - { - "epoch": 39.0, - "grad_norm": 0.23121486604213715, - "learning_rate": 4.933333333333334e-05, - "loss": 0.0117, - "step": 390 - }, - { - "epoch": 40.0, - "grad_norm": 0.13266825675964355, - "learning_rate": 4.4888888888888894e-05, - "loss": 0.0113, - "step": 400 - }, - { - "epoch": 40.0, - "eval_loss": 1.1694066524505615, - "eval_runtime": 1.7708, - "eval_samples_per_second": 2.824, - "eval_steps_per_second": 2.824, - "step": 400 - } - ], - "logging_steps": 10, - "max_steps": 500, - "num_input_tokens_seen": 0, - "num_train_epochs": 50, - "save_steps": 100, - "stateful_callbacks": { - "TrainerControl": { - "args": { - "should_epoch_stop": false, - "should_evaluate": false, - "should_log": false, - "should_save": true, - "should_training_stop": false - }, - "attributes": {} - } - }, - "total_flos": 5.310201565544448e+16, - "train_batch_size": 1, - "trial_name": null, - "trial_params": null -} diff --git a/checkpoint-400/training_args.bin b/checkpoint-400/training_args.bin deleted file mode 100644 index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000 --- a/checkpoint-400/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f -size 5777 diff --git a/checkpoint-500/README.md b/checkpoint-500/README.md deleted file mode 100644 index da869e54abd54b0fea18dcc9516b16918f684370..0000000000000000000000000000000000000000 --- a/checkpoint-500/README.md +++ /dev/null @@ -1,207 +0,0 @@ ---- -base_model: meta-llama/Llama-3.2-3B-Instruct -library_name: peft -pipeline_tag: text-generation -tags: -- base_model:adapter:meta-llama/Llama-3.2-3B-Instruct -- lora -- transformers ---- - -# Model Card for Model ID - - - - - -## Model Details - -### Model Description - - - - - -- **Developed by:** [More Information Needed] -- **Funded by [optional]:** [More Information Needed] -- **Shared by [optional]:** [More Information Needed] -- **Model type:** [More Information Needed] -- **Language(s) (NLP):** [More Information Needed] -- **License:** [More Information Needed] -- **Finetuned from model [optional]:** [More Information Needed] - -### Model Sources [optional] - - - -- **Repository:** [More Information Needed] -- **Paper [optional]:** [More Information Needed] -- **Demo [optional]:** [More Information Needed] - -## Uses - - - -### Direct Use - - - -[More Information Needed] - -### Downstream Use [optional] - - - -[More Information Needed] - -### Out-of-Scope Use - - - -[More Information Needed] - -## Bias, Risks, and Limitations - - - -[More Information Needed] - -### Recommendations - - - -Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. - -## How to Get Started with the Model - -Use the code below to get started with the model. - -[More Information Needed] - -## Training Details - -### Training Data - - - -[More Information Needed] - -### Training Procedure - - - -#### Preprocessing [optional] - -[More Information Needed] - - -#### Training Hyperparameters - -- **Training regime:** [More Information Needed] - -#### Speeds, Sizes, Times [optional] - - - -[More Information Needed] - -## Evaluation - - - -### Testing Data, Factors & Metrics - -#### Testing Data - - - -[More Information Needed] - -#### Factors - - - -[More Information Needed] - -#### Metrics - - - -[More Information Needed] - -### Results - -[More Information Needed] - -#### Summary - - - -## Model Examination [optional] - - - -[More Information Needed] - -## Environmental Impact - - - -Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). - -- **Hardware Type:** [More Information Needed] -- **Hours used:** [More Information Needed] -- **Cloud Provider:** [More Information Needed] -- **Compute Region:** [More Information Needed] -- **Carbon Emitted:** [More Information Needed] - -## Technical Specifications [optional] - -### Model Architecture and Objective - -[More Information Needed] - -### Compute Infrastructure - -[More Information Needed] - -#### Hardware - -[More Information Needed] - -#### Software - -[More Information Needed] - -## Citation [optional] - - - -**BibTeX:** - -[More Information Needed] - -**APA:** - -[More Information Needed] - -## Glossary [optional] - - - -[More Information Needed] - -## More Information [optional] - -[More Information Needed] - -## Model Card Authors [optional] - -[More Information Needed] - -## Model Card Contact - -[More Information Needed] -### Framework versions - -- PEFT 0.17.1 \ No newline at end of file diff --git a/checkpoint-500/adapter_config.json b/checkpoint-500/adapter_config.json deleted file mode 100644 index c9a27d527a89fd0081c994e17bd2b908b8038d6e..0000000000000000000000000000000000000000 --- a/checkpoint-500/adapter_config.json +++ /dev/null @@ -1,42 +0,0 @@ -{ - "alpha_pattern": {}, - "auto_mapping": null, - "base_model_name_or_path": "meta-llama/Llama-3.2-3B-Instruct", - "bias": "none", - "corda_config": null, - "eva_config": null, - "exclude_modules": null, - "fan_in_fan_out": false, - "inference_mode": true, - "init_lora_weights": true, - "layer_replication": null, - "layers_pattern": null, - "layers_to_transform": null, - "loftq_config": {}, - "lora_alpha": 32, - "lora_bias": false, - "lora_dropout": 0.1, - "megatron_config": null, - "megatron_core": "megatron.core", - "modules_to_save": null, - "peft_type": "LORA", - "qalora_group_size": 16, - "r": 16, - "rank_pattern": {}, - "revision": null, - "target_modules": [ - "down_proj", - "v_proj", - "q_proj", - "k_proj", - "gate_proj", - "o_proj", - "up_proj" - ], - "target_parameters": null, - "task_type": "CAUSAL_LM", - "trainable_token_indices": null, - "use_dora": false, - "use_qalora": false, - "use_rslora": false -} \ No newline at end of file diff --git a/checkpoint-500/adapter_model.safetensors b/checkpoint-500/adapter_model.safetensors deleted file mode 100644 index 7a9846a96572118b10e28d68186ff4d9910f14c8..0000000000000000000000000000000000000000 --- a/checkpoint-500/adapter_model.safetensors +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f1267898d59499b11e00e1bb133bce956e6ae4d0f5e56bc474251ec2c869df0e -size 97307544 diff --git a/checkpoint-500/chat_template.jinja b/checkpoint-500/chat_template.jinja deleted file mode 100644 index 1bad6a0f648dccdbec523ca79ba90fbcfc806af0..0000000000000000000000000000000000000000 --- a/checkpoint-500/chat_template.jinja +++ /dev/null @@ -1,93 +0,0 @@ -{{- bos_token }} -{%- if custom_tools is defined %} - {%- set tools = custom_tools %} -{%- endif %} -{%- if not tools_in_user_message is defined %} - {%- set tools_in_user_message = true %} -{%- endif %} -{%- if not date_string is defined %} - {%- if strftime_now is defined %} - {%- set date_string = strftime_now("%d %b %Y") %} - {%- else %} - {%- set date_string = "26 Jul 2024" %} - {%- endif %} -{%- endif %} -{%- if not tools is defined %} - {%- set tools = none %} -{%- endif %} - -{#- This block extracts the system message, so we can slot it into the right place. #} -{%- if messages[0]['role'] == 'system' %} - {%- set system_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} -{%- else %} - {%- set system_message = "" %} -{%- endif %} - -{#- System message #} -{{- "<|start_header_id|>system<|end_header_id|>\n\n" }} -{%- if tools is not none %} - {{- "Environment: ipython\n" }} -{%- endif %} -{{- "Cutting Knowledge Date: December 2023\n" }} -{{- "Today Date: " + date_string + "\n\n" }} -{%- if tools is not none and not tools_in_user_message %} - {{- "You have access to the following functions. To call a function, please respond with JSON for a function call." }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} -{%- endif %} -{{- system_message }} -{{- "<|eot_id|>" }} - -{#- Custom tools are passed in a user message with some extra guidance #} -{%- if tools_in_user_message and not tools is none %} - {#- Extract the first user message so we can plug it in here #} - {%- if messages | length != 0 %} - {%- set first_user_message = messages[0]['content']|trim %} - {%- set messages = messages[1:] %} - {%- else %} - {{- raise_exception("Cannot put tools in the first user message when there's no first user message!") }} -{%- endif %} - {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}} - {{- "Given the following functions, please respond with a JSON for a function call " }} - {{- "with its proper arguments that best answers the given prompt.\n\n" }} - {{- 'Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}.' }} - {{- "Do not use variables.\n\n" }} - {%- for t in tools %} - {{- t | tojson(indent=4) }} - {{- "\n\n" }} - {%- endfor %} - {{- first_user_message + "<|eot_id|>"}} -{%- endif %} - -{%- for message in messages %} - {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %} - {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }} - {%- elif 'tool_calls' in message %} - {%- if not message.tool_calls|length == 1 %} - {{- raise_exception("This model only supports single tool-calls at once!") }} - {%- endif %} - {%- set tool_call = message.tool_calls[0].function %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}} - {{- '{"name": "' + tool_call.name + '", ' }} - {{- '"parameters": ' }} - {{- tool_call.arguments | tojson }} - {{- "}" }} - {{- "<|eot_id|>" }} - {%- elif message.role == "tool" or message.role == "ipython" %} - {{- "<|start_header_id|>ipython<|end_header_id|>\n\n" }} - {%- if message.content is mapping or message.content is iterable %} - {{- message.content | tojson }} - {%- else %} - {{- message.content }} - {%- endif %} - {{- "<|eot_id|>" }} - {%- endif %} -{%- endfor %} -{%- if add_generation_prompt %} - {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }} -{%- endif %} diff --git a/checkpoint-500/optimizer.pt b/checkpoint-500/optimizer.pt deleted file mode 100644 index f7c2398a130ab9ffd8b90defabe5571440bc8cc1..0000000000000000000000000000000000000000 --- a/checkpoint-500/optimizer.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:364e4794f5e5265e6208ffb91534397b3f81c0ffd11eb1f70e677b82917cd811 -size 194846331 diff --git a/checkpoint-500/rng_state.pth b/checkpoint-500/rng_state.pth deleted file mode 100644 index 1ba3c4495fdbd5b478e34246759af0e667a57976..0000000000000000000000000000000000000000 --- a/checkpoint-500/rng_state.pth +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cbf17c6ea5a2364f5c121447c9554bb3437ed12ac00bd180e0c39823e3932887 -size 14645 diff --git a/checkpoint-500/scaler.pt b/checkpoint-500/scaler.pt deleted file mode 100644 index 86c857e8514e5db52a765434b135695dac4c9c36..0000000000000000000000000000000000000000 --- a/checkpoint-500/scaler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f77569c2e850b04af982cc8c1389f1430851448915c593b69e5da36ce05b71d7 -size 1383 diff --git a/checkpoint-500/scheduler.pt b/checkpoint-500/scheduler.pt deleted file mode 100644 index 7d406056d4209a0bc88bb800efa5129731063e3b..0000000000000000000000000000000000000000 --- a/checkpoint-500/scheduler.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5fc3f7ed409df14d1c62e690e63b0c5e5d89499208bb0e61ef44ccedc3f1d40a -size 1465 diff --git a/checkpoint-500/special_tokens_map.json b/checkpoint-500/special_tokens_map.json deleted file mode 100644 index b43be96621d147110fb8a18b5776ec6e38516127..0000000000000000000000000000000000000000 --- a/checkpoint-500/special_tokens_map.json +++ /dev/null @@ -1,17 +0,0 @@ -{ - "bos_token": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "eos_token": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false - }, - "pad_token": "<|eot_id|>" -} diff --git a/checkpoint-500/tokenizer.json b/checkpoint-500/tokenizer.json deleted file mode 100644 index 8e89913d63cf04862fcbf301032ee349780489f2..0000000000000000000000000000000000000000 --- a/checkpoint-500/tokenizer.json +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:912e72517f7521f3273166a7879fe54c52b397f8c48ea80f8f1ed794beb24c09 -size 17210184 diff --git a/checkpoint-500/tokenizer_config.json b/checkpoint-500/tokenizer_config.json deleted file mode 100644 index 3beeacc86a6ca3cae14ad3004263ab74a4bac07a..0000000000000000000000000000000000000000 --- a/checkpoint-500/tokenizer_config.json +++ /dev/null @@ -1,2063 +0,0 @@ -{ - "added_tokens_decoder": { - "128000": { - "content": "<|begin_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128001": { - "content": "<|end_of_text|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128002": { - "content": "<|reserved_special_token_0|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128003": { - "content": "<|reserved_special_token_1|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128004": { - "content": "<|finetune_right_pad_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128005": { - "content": "<|reserved_special_token_2|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128006": { - "content": "<|start_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128007": { - "content": "<|end_header_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128008": { - "content": "<|eom_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128009": { - "content": "<|eot_id|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128010": { - "content": "<|python_tag|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128011": { - "content": "<|reserved_special_token_3|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128012": { - "content": "<|reserved_special_token_4|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128013": { - "content": "<|reserved_special_token_5|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128014": { - "content": "<|reserved_special_token_6|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128015": { - "content": "<|reserved_special_token_7|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128016": { - "content": "<|reserved_special_token_8|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128017": { - "content": "<|reserved_special_token_9|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128018": { - "content": "<|reserved_special_token_10|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128019": { - "content": "<|reserved_special_token_11|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128020": { - "content": "<|reserved_special_token_12|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128021": { - "content": "<|reserved_special_token_13|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128022": { - "content": "<|reserved_special_token_14|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128023": { - "content": "<|reserved_special_token_15|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128024": { - "content": "<|reserved_special_token_16|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128025": { - "content": "<|reserved_special_token_17|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128026": { - "content": "<|reserved_special_token_18|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128027": { - "content": "<|reserved_special_token_19|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128028": { - "content": "<|reserved_special_token_20|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128029": { - "content": "<|reserved_special_token_21|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128030": { - "content": "<|reserved_special_token_22|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128031": { - "content": "<|reserved_special_token_23|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128032": { - "content": "<|reserved_special_token_24|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128033": { - "content": "<|reserved_special_token_25|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128034": { - "content": "<|reserved_special_token_26|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128035": { - "content": "<|reserved_special_token_27|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128036": { - "content": "<|reserved_special_token_28|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128037": { - "content": "<|reserved_special_token_29|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128038": { - "content": "<|reserved_special_token_30|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128039": { - "content": "<|reserved_special_token_31|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128040": { - "content": "<|reserved_special_token_32|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128041": { - "content": "<|reserved_special_token_33|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128042": { - "content": "<|reserved_special_token_34|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128043": { - "content": "<|reserved_special_token_35|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128044": { - "content": "<|reserved_special_token_36|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128045": { - "content": "<|reserved_special_token_37|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128046": { - "content": "<|reserved_special_token_38|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128047": { - "content": "<|reserved_special_token_39|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128048": { - "content": "<|reserved_special_token_40|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128049": { - "content": "<|reserved_special_token_41|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128050": { - "content": "<|reserved_special_token_42|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128051": { - "content": "<|reserved_special_token_43|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128052": { - "content": "<|reserved_special_token_44|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128053": { - "content": "<|reserved_special_token_45|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128054": { - "content": "<|reserved_special_token_46|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128055": { - "content": "<|reserved_special_token_47|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128056": { - "content": "<|reserved_special_token_48|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128057": { - "content": "<|reserved_special_token_49|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128058": { - "content": "<|reserved_special_token_50|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128059": { - "content": "<|reserved_special_token_51|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128060": { - "content": "<|reserved_special_token_52|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128061": { - "content": "<|reserved_special_token_53|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128062": { - "content": "<|reserved_special_token_54|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128063": { - "content": "<|reserved_special_token_55|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128064": { - "content": "<|reserved_special_token_56|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128065": { - "content": "<|reserved_special_token_57|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128066": { - "content": "<|reserved_special_token_58|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128067": { - "content": "<|reserved_special_token_59|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128068": { - "content": "<|reserved_special_token_60|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128069": { - "content": "<|reserved_special_token_61|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128070": { - "content": "<|reserved_special_token_62|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128071": { - "content": "<|reserved_special_token_63|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128072": { - "content": "<|reserved_special_token_64|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128073": { - "content": "<|reserved_special_token_65|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128074": { - "content": "<|reserved_special_token_66|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128075": { - "content": "<|reserved_special_token_67|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128076": { - "content": "<|reserved_special_token_68|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128077": { - "content": "<|reserved_special_token_69|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128078": { - "content": "<|reserved_special_token_70|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128079": { - "content": "<|reserved_special_token_71|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128080": { - "content": "<|reserved_special_token_72|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128081": { - "content": "<|reserved_special_token_73|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128082": { - "content": "<|reserved_special_token_74|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128083": { - "content": "<|reserved_special_token_75|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128084": { - "content": "<|reserved_special_token_76|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128085": { - "content": "<|reserved_special_token_77|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128086": { - "content": "<|reserved_special_token_78|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128087": { - "content": "<|reserved_special_token_79|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128088": { - "content": "<|reserved_special_token_80|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128089": { - "content": "<|reserved_special_token_81|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128090": { - "content": "<|reserved_special_token_82|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128091": { - "content": "<|reserved_special_token_83|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128092": { - "content": "<|reserved_special_token_84|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128093": { - "content": "<|reserved_special_token_85|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128094": { - "content": "<|reserved_special_token_86|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128095": { - "content": "<|reserved_special_token_87|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128096": { - "content": "<|reserved_special_token_88|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128097": { - "content": "<|reserved_special_token_89|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128098": { - "content": "<|reserved_special_token_90|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128099": { - "content": "<|reserved_special_token_91|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128100": { - "content": "<|reserved_special_token_92|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128101": { - "content": "<|reserved_special_token_93|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128102": { - "content": "<|reserved_special_token_94|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128103": { - "content": "<|reserved_special_token_95|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128104": { - "content": "<|reserved_special_token_96|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128105": { - "content": "<|reserved_special_token_97|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128106": { - "content": "<|reserved_special_token_98|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128107": { - "content": "<|reserved_special_token_99|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128108": { - "content": "<|reserved_special_token_100|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128109": { - "content": "<|reserved_special_token_101|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128110": { - "content": "<|reserved_special_token_102|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128111": { - "content": "<|reserved_special_token_103|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128112": { - "content": "<|reserved_special_token_104|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128113": { - "content": "<|reserved_special_token_105|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128114": { - "content": "<|reserved_special_token_106|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128115": { - "content": "<|reserved_special_token_107|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128116": { - "content": "<|reserved_special_token_108|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128117": { - "content": "<|reserved_special_token_109|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128118": { - "content": "<|reserved_special_token_110|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128119": { - "content": "<|reserved_special_token_111|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128120": { - "content": "<|reserved_special_token_112|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128121": { - "content": "<|reserved_special_token_113|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128122": { - "content": "<|reserved_special_token_114|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128123": { - "content": "<|reserved_special_token_115|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128124": { - "content": "<|reserved_special_token_116|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128125": { - "content": "<|reserved_special_token_117|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128126": { - "content": "<|reserved_special_token_118|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128127": { - "content": "<|reserved_special_token_119|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128128": { - "content": "<|reserved_special_token_120|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128129": { - "content": "<|reserved_special_token_121|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128130": { - "content": "<|reserved_special_token_122|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128131": { - "content": "<|reserved_special_token_123|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128132": { - "content": "<|reserved_special_token_124|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128133": { - "content": "<|reserved_special_token_125|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128134": { - "content": "<|reserved_special_token_126|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128135": { - "content": "<|reserved_special_token_127|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128136": { - "content": "<|reserved_special_token_128|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128137": { - "content": "<|reserved_special_token_129|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128138": { - "content": "<|reserved_special_token_130|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128139": { - "content": "<|reserved_special_token_131|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128140": { - "content": "<|reserved_special_token_132|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128141": { - "content": "<|reserved_special_token_133|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128142": { - "content": "<|reserved_special_token_134|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128143": { - "content": "<|reserved_special_token_135|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128144": { - "content": "<|reserved_special_token_136|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128145": { - "content": "<|reserved_special_token_137|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128146": { - "content": "<|reserved_special_token_138|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128147": { - "content": "<|reserved_special_token_139|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128148": { - "content": "<|reserved_special_token_140|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128149": { - "content": "<|reserved_special_token_141|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128150": { - "content": "<|reserved_special_token_142|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128151": { - "content": "<|reserved_special_token_143|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128152": { - "content": "<|reserved_special_token_144|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128153": { - "content": "<|reserved_special_token_145|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128154": { - "content": "<|reserved_special_token_146|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128155": { - "content": "<|reserved_special_token_147|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128156": { - "content": "<|reserved_special_token_148|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128157": { - "content": "<|reserved_special_token_149|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128158": { - "content": "<|reserved_special_token_150|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128159": { - "content": "<|reserved_special_token_151|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128160": { - "content": "<|reserved_special_token_152|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128161": { - "content": "<|reserved_special_token_153|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128162": { - "content": "<|reserved_special_token_154|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128163": { - "content": "<|reserved_special_token_155|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128164": { - "content": "<|reserved_special_token_156|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128165": { - "content": "<|reserved_special_token_157|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128166": { - "content": "<|reserved_special_token_158|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128167": { - "content": "<|reserved_special_token_159|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128168": { - "content": "<|reserved_special_token_160|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128169": { - "content": "<|reserved_special_token_161|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128170": { - "content": "<|reserved_special_token_162|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128171": { - "content": "<|reserved_special_token_163|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128172": { - "content": "<|reserved_special_token_164|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128173": { - "content": "<|reserved_special_token_165|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128174": { - "content": "<|reserved_special_token_166|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128175": { - "content": "<|reserved_special_token_167|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128176": { - "content": "<|reserved_special_token_168|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128177": { - "content": "<|reserved_special_token_169|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128178": { - "content": "<|reserved_special_token_170|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128179": { - "content": "<|reserved_special_token_171|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128180": { - "content": "<|reserved_special_token_172|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128181": { - "content": "<|reserved_special_token_173|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128182": { - "content": "<|reserved_special_token_174|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128183": { - "content": "<|reserved_special_token_175|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128184": { - "content": "<|reserved_special_token_176|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128185": { - "content": "<|reserved_special_token_177|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128186": { - "content": "<|reserved_special_token_178|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128187": { - "content": "<|reserved_special_token_179|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128188": { - "content": "<|reserved_special_token_180|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128189": { - "content": "<|reserved_special_token_181|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128190": { - "content": "<|reserved_special_token_182|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128191": { - "content": "<|reserved_special_token_183|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128192": { - "content": "<|reserved_special_token_184|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128193": { - "content": "<|reserved_special_token_185|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128194": { - "content": "<|reserved_special_token_186|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128195": { - "content": "<|reserved_special_token_187|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128196": { - "content": "<|reserved_special_token_188|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128197": { - "content": "<|reserved_special_token_189|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128198": { - "content": "<|reserved_special_token_190|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128199": { - "content": "<|reserved_special_token_191|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128200": { - "content": "<|reserved_special_token_192|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128201": { - "content": "<|reserved_special_token_193|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128202": { - "content": "<|reserved_special_token_194|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128203": { - "content": "<|reserved_special_token_195|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128204": { - "content": "<|reserved_special_token_196|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128205": { - "content": "<|reserved_special_token_197|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128206": { - "content": "<|reserved_special_token_198|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128207": { - "content": "<|reserved_special_token_199|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128208": { - "content": "<|reserved_special_token_200|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128209": { - "content": "<|reserved_special_token_201|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128210": { - "content": "<|reserved_special_token_202|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128211": { - "content": "<|reserved_special_token_203|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128212": { - "content": "<|reserved_special_token_204|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128213": { - "content": "<|reserved_special_token_205|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128214": { - "content": "<|reserved_special_token_206|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128215": { - "content": "<|reserved_special_token_207|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128216": { - "content": "<|reserved_special_token_208|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128217": { - "content": "<|reserved_special_token_209|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128218": { - "content": "<|reserved_special_token_210|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128219": { - "content": "<|reserved_special_token_211|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128220": { - "content": "<|reserved_special_token_212|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128221": { - "content": "<|reserved_special_token_213|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128222": { - "content": "<|reserved_special_token_214|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128223": { - "content": "<|reserved_special_token_215|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128224": { - "content": "<|reserved_special_token_216|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128225": { - "content": "<|reserved_special_token_217|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128226": { - "content": "<|reserved_special_token_218|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128227": { - "content": "<|reserved_special_token_219|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128228": { - "content": "<|reserved_special_token_220|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128229": { - "content": "<|reserved_special_token_221|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128230": { - "content": "<|reserved_special_token_222|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128231": { - "content": "<|reserved_special_token_223|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128232": { - "content": "<|reserved_special_token_224|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128233": { - "content": "<|reserved_special_token_225|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128234": { - "content": "<|reserved_special_token_226|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128235": { - "content": "<|reserved_special_token_227|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128236": { - "content": "<|reserved_special_token_228|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128237": { - "content": "<|reserved_special_token_229|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128238": { - "content": "<|reserved_special_token_230|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128239": { - "content": "<|reserved_special_token_231|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128240": { - "content": "<|reserved_special_token_232|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128241": { - "content": "<|reserved_special_token_233|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128242": { - "content": "<|reserved_special_token_234|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128243": { - "content": "<|reserved_special_token_235|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128244": { - "content": "<|reserved_special_token_236|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128245": { - "content": "<|reserved_special_token_237|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128246": { - "content": "<|reserved_special_token_238|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128247": { - "content": "<|reserved_special_token_239|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128248": { - "content": "<|reserved_special_token_240|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128249": { - "content": "<|reserved_special_token_241|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128250": { - "content": "<|reserved_special_token_242|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128251": { - "content": "<|reserved_special_token_243|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128252": { - "content": "<|reserved_special_token_244|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128253": { - "content": "<|reserved_special_token_245|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128254": { - "content": "<|reserved_special_token_246|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - }, - "128255": { - "content": "<|reserved_special_token_247|>", - "lstrip": false, - "normalized": false, - "rstrip": false, - "single_word": false, - "special": true - } - }, - "bos_token": "<|begin_of_text|>", - "clean_up_tokenization_spaces": true, - "eos_token": "<|eot_id|>", - "extra_special_tokens": {}, - "model_input_names": [ - "input_ids", - "attention_mask" - ], - "model_max_length": 131072, - "pad_token": "<|eot_id|>", - "tokenizer_class": "PreTrainedTokenizerFast" -} diff --git a/checkpoint-500/trainer_state.json b/checkpoint-500/trainer_state.json deleted file mode 100644 index ad1084b0a242485512b68bd91bce462e02c2d094..0000000000000000000000000000000000000000 --- a/checkpoint-500/trainer_state.json +++ /dev/null @@ -1,464 +0,0 @@ -{ - "best_global_step": 50, - "best_metric": 0.7558398842811584, - "best_model_checkpoint": null, - "epoch": 50.0, - "eval_steps": 50, - "global_step": 500, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 1.0, - "grad_norm": 1.4660576581954956, - "learning_rate": 3.6e-05, - "loss": 1.152, - "step": 10 - }, - { - "epoch": 2.0, - "grad_norm": 0.8749533295631409, - "learning_rate": 7.6e-05, - "loss": 1.0421, - "step": 20 - }, - { - "epoch": 3.0, - "grad_norm": 3.37060284614563, - "learning_rate": 0.000116, - "loss": 0.8539, - "step": 30 - }, - { - "epoch": 4.0, - "grad_norm": 1.5355278253555298, - "learning_rate": 0.00015600000000000002, - "loss": 0.5483, - "step": 40 - }, - { - "epoch": 5.0, - "grad_norm": 2.454838514328003, - "learning_rate": 0.000196, - "loss": 0.3736, - "step": 50 - }, - { - "epoch": 5.0, - "eval_loss": 0.7558398842811584, - "eval_runtime": 1.7227, - "eval_samples_per_second": 2.902, - "eval_steps_per_second": 2.902, - "step": 50 - }, - { - "epoch": 6.0, - "grad_norm": 3.676417827606201, - "learning_rate": 0.000196, - "loss": 0.2291, - "step": 60 - }, - { - "epoch": 7.0, - "grad_norm": 2.192375898361206, - "learning_rate": 0.00019155555555555554, - "loss": 0.1244, - "step": 70 - }, - { - "epoch": 8.0, - "grad_norm": 2.630005359649658, - "learning_rate": 0.00018711111111111112, - "loss": 0.0862, - "step": 80 - }, - { - "epoch": 9.0, - "grad_norm": 0.5021786093711853, - "learning_rate": 0.00018266666666666667, - "loss": 0.0614, - "step": 90 - }, - { - "epoch": 10.0, - "grad_norm": 0.38170942664146423, - "learning_rate": 0.00017822222222222222, - "loss": 0.0471, - "step": 100 - }, - { - "epoch": 10.0, - "eval_loss": 0.8806974291801453, - "eval_runtime": 1.7764, - "eval_samples_per_second": 2.815, - "eval_steps_per_second": 2.815, - "step": 100 - }, - { - "epoch": 11.0, - "grad_norm": 1.223647952079773, - "learning_rate": 0.0001737777777777778, - "loss": 0.0359, - "step": 110 - }, - { - "epoch": 12.0, - "grad_norm": 0.5452818870544434, - "learning_rate": 0.00016933333333333335, - "loss": 0.0289, - "step": 120 - }, - { - "epoch": 13.0, - "grad_norm": 0.19034886360168457, - "learning_rate": 0.0001648888888888889, - "loss": 0.029, - "step": 130 - }, - { - "epoch": 14.0, - "grad_norm": 0.7483140230178833, - "learning_rate": 0.00016044444444444445, - "loss": 0.0247, - "step": 140 - }, - { - "epoch": 15.0, - "grad_norm": 0.34800082445144653, - "learning_rate": 0.00015600000000000002, - "loss": 0.0193, - "step": 150 - }, - { - "epoch": 15.0, - "eval_loss": 0.9916993379592896, - "eval_runtime": 1.7667, - "eval_samples_per_second": 2.83, - "eval_steps_per_second": 2.83, - "step": 150 - }, - { - "epoch": 16.0, - "grad_norm": 0.24237586557865143, - "learning_rate": 0.00015155555555555557, - "loss": 0.0176, - "step": 160 - }, - { - "epoch": 17.0, - "grad_norm": 0.13607177138328552, - "learning_rate": 0.00014711111111111112, - "loss": 0.0131, - "step": 170 - }, - { - "epoch": 18.0, - "grad_norm": 0.3655266761779785, - "learning_rate": 0.00014266666666666667, - "loss": 0.0164, - "step": 180 - }, - { - "epoch": 19.0, - "grad_norm": 0.08258651196956635, - "learning_rate": 0.00013822222222222222, - "loss": 0.013, - "step": 190 - }, - { - "epoch": 20.0, - "grad_norm": 0.1830163151025772, - "learning_rate": 0.00013377777777777777, - "loss": 0.0126, - "step": 200 - }, - { - "epoch": 20.0, - "eval_loss": 1.0726474523544312, - "eval_runtime": 1.7657, - "eval_samples_per_second": 2.832, - "eval_steps_per_second": 2.832, - "step": 200 - }, - { - "epoch": 21.0, - "grad_norm": 0.12009257823228836, - "learning_rate": 0.00012933333333333332, - "loss": 0.0108, - "step": 210 - }, - { - "epoch": 22.0, - "grad_norm": 0.1172371432185173, - "learning_rate": 0.0001248888888888889, - "loss": 0.0122, - "step": 220 - }, - { - "epoch": 23.0, - "grad_norm": 0.14445751905441284, - "learning_rate": 0.00012044444444444445, - "loss": 0.0121, - "step": 230 - }, - { - "epoch": 24.0, - "grad_norm": 0.18198293447494507, - "learning_rate": 0.000116, - "loss": 0.0128, - "step": 240 - }, - { - "epoch": 25.0, - "grad_norm": 0.1562514454126358, - "learning_rate": 0.00011155555555555556, - "loss": 0.0117, - "step": 250 - }, - { - "epoch": 25.0, - "eval_loss": 1.106227159500122, - "eval_runtime": 1.7564, - "eval_samples_per_second": 2.847, - "eval_steps_per_second": 2.847, - "step": 250 - }, - { - "epoch": 26.0, - "grad_norm": 0.06052432581782341, - "learning_rate": 0.00010711111111111111, - "loss": 0.0123, - "step": 260 - }, - { - "epoch": 27.0, - "grad_norm": 0.03066837601363659, - "learning_rate": 0.00010266666666666666, - "loss": 0.0106, - "step": 270 - }, - { - "epoch": 28.0, - "grad_norm": 0.034792304039001465, - "learning_rate": 9.822222222222223e-05, - "loss": 0.0124, - "step": 280 - }, - { - "epoch": 29.0, - "grad_norm": 0.028368409723043442, - "learning_rate": 9.377777777777779e-05, - "loss": 0.0107, - "step": 290 - }, - { - "epoch": 30.0, - "grad_norm": 0.03258921578526497, - "learning_rate": 8.933333333333334e-05, - "loss": 0.0109, - "step": 300 - }, - { - "epoch": 30.0, - "eval_loss": 1.1306606531143188, - "eval_runtime": 1.7675, - "eval_samples_per_second": 2.829, - "eval_steps_per_second": 2.829, - "step": 300 - }, - { - "epoch": 31.0, - "grad_norm": 0.26905232667922974, - "learning_rate": 8.488888888888889e-05, - "loss": 0.0131, - "step": 310 - }, - { - "epoch": 32.0, - "grad_norm": 0.15363195538520813, - "learning_rate": 8.044444444444444e-05, - "loss": 0.0121, - "step": 320 - }, - { - "epoch": 33.0, - "grad_norm": 0.030869223177433014, - "learning_rate": 7.6e-05, - "loss": 0.0104, - "step": 330 - }, - { - "epoch": 34.0, - "grad_norm": 0.07273676246404648, - "learning_rate": 7.155555555555555e-05, - "loss": 0.0112, - "step": 340 - }, - { - "epoch": 35.0, - "grad_norm": 0.025629112496972084, - "learning_rate": 6.711111111111112e-05, - "loss": 0.0121, - "step": 350 - }, - { - "epoch": 35.0, - "eval_loss": 1.128761887550354, - "eval_runtime": 1.7518, - "eval_samples_per_second": 2.854, - "eval_steps_per_second": 2.854, - "step": 350 - }, - { - "epoch": 36.0, - "grad_norm": 0.06929411739110947, - "learning_rate": 6.266666666666667e-05, - "loss": 0.0099, - "step": 360 - }, - { - "epoch": 37.0, - "grad_norm": 0.102758027613163, - "learning_rate": 5.8222222222222224e-05, - "loss": 0.0096, - "step": 370 - }, - { - "epoch": 38.0, - "grad_norm": 0.19261795282363892, - "learning_rate": 5.377777777777778e-05, - "loss": 0.0112, - "step": 380 - }, - { - "epoch": 39.0, - "grad_norm": 0.23121486604213715, - "learning_rate": 4.933333333333334e-05, - "loss": 0.0117, - "step": 390 - }, - { - "epoch": 40.0, - "grad_norm": 0.13266825675964355, - "learning_rate": 4.4888888888888894e-05, - "loss": 0.0113, - "step": 400 - }, - { - "epoch": 40.0, - "eval_loss": 1.1694066524505615, - "eval_runtime": 1.7708, - "eval_samples_per_second": 2.824, - "eval_steps_per_second": 2.824, - "step": 400 - }, - { - "epoch": 41.0, - "grad_norm": 0.17276649177074432, - "learning_rate": 4.0444444444444444e-05, - "loss": 0.0103, - "step": 410 - }, - { - "epoch": 42.0, - "grad_norm": 0.13706862926483154, - "learning_rate": 3.6e-05, - "loss": 0.0115, - "step": 420 - }, - { - "epoch": 43.0, - "grad_norm": 0.1022062748670578, - "learning_rate": 3.155555555555556e-05, - "loss": 0.0118, - "step": 430 - }, - { - "epoch": 44.0, - "grad_norm": 0.11416096985340118, - "learning_rate": 2.7111111111111114e-05, - "loss": 0.0096, - "step": 440 - }, - { - "epoch": 45.0, - "grad_norm": 0.14480136334896088, - "learning_rate": 2.2666666666666668e-05, - "loss": 0.0093, - "step": 450 - }, - { - "epoch": 45.0, - "eval_loss": 1.1621501445770264, - "eval_runtime": 1.7753, - "eval_samples_per_second": 2.816, - "eval_steps_per_second": 2.816, - "step": 450 - }, - { - "epoch": 46.0, - "grad_norm": 0.1180804893374443, - "learning_rate": 1.8222222222222224e-05, - "loss": 0.0126, - "step": 460 - }, - { - "epoch": 47.0, - "grad_norm": 0.05086653307080269, - "learning_rate": 1.3777777777777778e-05, - "loss": 0.0111, - "step": 470 - }, - { - "epoch": 48.0, - "grad_norm": 0.032583802938461304, - "learning_rate": 9.333333333333334e-06, - "loss": 0.0094, - "step": 480 - }, - { - "epoch": 49.0, - "grad_norm": 0.04545021802186966, - "learning_rate": 4.888888888888889e-06, - "loss": 0.0117, - "step": 490 - }, - { - "epoch": 50.0, - "grad_norm": 0.05125224590301514, - "learning_rate": 4.444444444444445e-07, - "loss": 0.0105, - "step": 500 - }, - { - "epoch": 50.0, - "eval_loss": 1.169873833656311, - "eval_runtime": 1.7599, - "eval_samples_per_second": 2.841, - "eval_steps_per_second": 2.841, - "step": 500 - } - ], - "logging_steps": 10, - "max_steps": 500, - "num_input_tokens_seen": 0, - "num_train_epochs": 50, - "save_steps": 100, - "stateful_callbacks": { - "TrainerControl": { - "args": { - "should_epoch_stop": false, - "should_evaluate": false, - "should_log": false, - "should_save": true, - "should_training_stop": true - }, - "attributes": {} - } - }, - "total_flos": 6.63775195693056e+16, - "train_batch_size": 1, - "trial_name": null, - "trial_params": null -} diff --git a/checkpoint-500/training_args.bin b/checkpoint-500/training_args.bin deleted file mode 100644 index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000 --- a/checkpoint-500/training_args.bin +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f -size 5777 diff --git a/special_tokens_map.json b/special_tokens_map.json deleted file mode 100644 index b90a4f3ca8530c09c5723f153257607c6fdabefc..0000000000000000000000000000000000000000 --- a/special_tokens_map.json +++ /dev/null @@ -1,40 +0,0 @@ -{ - "additional_special_tokens": [ - "▁
",
-    "▁",
-    "▁",
-    "▁",
-    "▁
",
-    "▁",
-    "▁",
-    "▁"
-  ],
-  "bos_token": {
-    "content": "",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "content": "",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
-}
diff --git a/tokenizer.json b/tokenizer.json
deleted file mode 100644
index fa5d179a4294feaa4747648098eaacd84fae3b98..0000000000000000000000000000000000000000
--- a/tokenizer.json
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3db85ad6e5063687453d32b28de462a4fc7c6809c38c1b45326e2efe6e6fbee6
-size 3620984
diff --git a/tokenizer_config.json b/tokenizer_config.json
deleted file mode 100644
index f47206bd85c500c1451b5821065dfc19e7fc2372..0000000000000000000000000000000000000000
--- a/tokenizer_config.json
+++ /dev/null
@@ -1,95 +0,0 @@
-{
-  "add_bos_token": true,
-  "add_eos_token": false,
-  "added_tokens_decoder": {
-    "0": {
-      "content": "",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "1": {
-      "content": "",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "2": {
-      "content": "",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "32007": {
-      "content": "▁
",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "32008": {
-      "content": "▁",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "32009": {
-      "content": "▁",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "32010": {
-      "content": "▁",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    }
-  },
-  "additional_special_tokens": [
-    "▁
",
-    "▁",
-    "▁",
-    "▁",
-    "▁
",
-    "▁",
-    "▁",
-    "▁"
-  ],
-  "bos_token": "",
-  "clean_up_tokenization_spaces": false,
-  "eos_token": "",
-  "eot_token": "▁",
-  "extra_special_tokens": {},
-  "fill_token": "",
-  "legacy": null,
-  "max_length": 2048,
-  "middle_token": "▁",
-  "model_max_length": 1000000000000000019884624838656,
-  "pad_to_multiple_of": null,
-  "pad_token": "",
-  "pad_token_type_id": 0,
-  "padding_side": "right",
-  "prefix_token": "▁
",
-  "sp_model_kwargs": {},
-  "stride": 0,
-  "suffix_token": "▁",
-  "tokenizer_class": "CodeLlamaTokenizerFast",
-  "truncation_side": "right",
-  "truncation_strategy": "longest_first",
-  "unk_token": "",
-  "use_default_system_prompt": false
-}
diff --git a/training_args.bin b/training_args.bin
deleted file mode 100644
index b6f9b4d71f20cf64f37af77abb548787efcfd08e..0000000000000000000000000000000000000000
--- a/training_args.bin
+++ /dev/null
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:cc19cfb8a50d9a9f7e0159709202419ad710285a055c411c21b750985626198f
-size 5777