boatbomber committed on
Commit
655f446
·
1 Parent(s): 7dffdc4

Update model

Browse files
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-BF16.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cf529b42ba4504c01eb295ce6db4041fa34d4c5b8d767d5aa8b5e75adf9c11a
3
- size 29547715616
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-F16.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2de7f7306aead27e445ca8996012bdbfa435f2470d7c8fa3b1f5e090dd8054e5
3
- size 29547716416
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q3_K_M.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8764b790108be382c9fbba69f553a599faa661ca44b8c412dbbc5688cbffba5f
3
- size 7339203616
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q4_K_M.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5bd43bf2279aff6739c85caad8a223137abda141879abbd7e715aa7a0a54aa1
3
- size 8988109856
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q4_K_S.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:81a0348c02ef0ea1366fa1543430d99ed7bafec0dee5f3cc5998c6363c318c4d
3
- size 8573430816
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q5_K_M.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d9ed5b2c7ae1601c65a3026149189707c1d94049f77102bd5cfbf484780209f
3
- size 10508872736
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q5_K_S.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:5976908470afb5f45779d6114efc7e6ee0eaed9a61524c169bee05019e29fef0
3
- size 10266553376
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q6_K.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b73bf089fa0fa04df9f2ca728bf55910bf12c1498dc7c0b75d85270ecb68247
3
- size 12124683296
 
 
 
 
DeepSeek-R1-Distill-Qwen-14B-Roblox-Luau-Q8_0.gguf DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9a6afdba6808b313ec694f0b6f23673e89299f8f21258923252b5d931c73552
3
- size 15701597216
 
 
 
 
README.md CHANGED
@@ -15,7 +15,7 @@ language:
15
 
16
  # R1-Distill-Qwen-14B-Roblox-Luau
17
 
18
- A fine tune of [deepseek-ai/DeepSeek-R1-Distill-Qwen-14B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B) using [boatbomber/Roblox-Luau-Reasoning-v1.0](https://huggingface.co/datasets/boatbomber/Roblox-Luau-Reasoning-v1.0). Fine tuning workflow is open sourced [here](https://huggingface.co/boatbomber/R1-Distill-Qwen-14B-Roblox-Luau/blob/main/run-finetune.ipynb).
19
 
20
  Recommended inference settings:
21
 
 
15
 
16
  # R1-Distill-Qwen-14B-Roblox-Luau
17
 
18
+ A fine tune of [deepseek-ai/DeepSeek-R1-Distill-Qwen-14B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B) using [boatbomber/Roblox-Luau-Reasoning-v1.0](https://huggingface.co/datasets/boatbomber/Roblox-Luau-Reasoning-v1.0), [boatbomber/roblox-info-dump](https://huggingface.co/datasets/boatbomber/roblox-info-dump), and [boatbomber/the-luau-stack](https://huggingface.co/datasets/boatbomber/the-luau-stack).
19
 
20
  Recommended inference settings:
21
 
config.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
- "_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
3
- "architectures": ["Qwen2ForCausalLM"],
 
4
  "attention_dropout": 0.0,
5
  "bos_token_id": 151643,
6
  "eos_token_id": 151643,
@@ -14,13 +15,13 @@
14
  "num_attention_heads": 40,
15
  "num_hidden_layers": 48,
16
  "num_key_value_heads": 8,
17
- "rms_norm_eps": 1e-5,
18
  "rope_scaling": null,
19
  "rope_theta": 1000000.0,
20
- "sliding_window": null,
21
  "tie_word_embeddings": false,
22
  "torch_dtype": "bfloat16",
23
- "transformers_version": "4.47.1",
24
  "use_cache": true,
25
  "use_sliding_window": false,
26
  "vocab_size": 152064
 
1
  {
2
+ "architectures": [
3
+ "Qwen2ForCausalLM"
4
+ ],
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 151643,
7
  "eos_token_id": 151643,
 
15
  "num_attention_heads": 40,
16
  "num_hidden_layers": 48,
17
  "num_key_value_heads": 8,
18
+ "rms_norm_eps": 1e-05,
19
  "rope_scaling": null,
20
  "rope_theta": 1000000.0,
21
+ "sliding_window": 131072,
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.51.2",
25
  "use_cache": true,
26
  "use_sliding_window": false,
27
  "vocab_size": 152064
generation_config.json CHANGED
@@ -5,5 +5,5 @@
5
  "eos_token_id": 151643,
6
  "temperature": 0.6,
7
  "top_p": 0.95,
8
- "transformers_version": "4.47.1"
9
  }
 
5
  "eos_token_id": 151643,
6
  "temperature": 0.6,
7
  "top_p": 0.95,
8
+ "transformers_version": "4.51.2"
9
  }
model-00001-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:235a3c85da149f98c86cd70fad6c2c56e61a9599ea0c95227cce4574d646b748
3
  size 4986211280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8293a3cb9b2e377217c58e92ab67c1cace58a3571ef530e1d77ed85301780e5
3
  size 4986211280
model-00002-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f6255be1d4d23c927f62d0d3555be9b0607132d212c852188b7195f138344e8
3
  size 4954847344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e3d50c5168c053e8c9b531967cb3ba32ed5f2463d85b4d351afeb021f84e26c
3
  size 4954847344
model-00003-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:926a287e5907d07c453b35e0fb73902f101721317d3eb89ac71af08a663cb9e8
3
  size 4954847392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b01a1117ff3aa71a4f9777f241f176317c7e98281d1f9b32cc55127b56818eb4
3
  size 4954847392
model-00004-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a08edb7f6ff16f50addb792dbe45308913ad6d41b7abd807379a540684dd923
3
  size 4954847392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:805cbea53195b7dd046244aea46ac6e831669bce5b33ebe35f1cc70913505317
3
  size 4954847392
model-00005-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfee7450e95aefdd2f4d09b24a078c595758d1b10e9d6ad2f13deb55a08bce88
3
  size 4954847392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7856ba7e9daf5cc88ad0e366445a2dc63805a2061d0d30a6cad1c786b913a018
3
  size 4954847392
model-00006-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a90126ba44728eec5ffe16a31d4e6a3e8d0dec1e7d512b0693a8c5d711e513fd
3
  size 4734533160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a622395ca2f76493ae50c5c09c62b88e341c09681da1a3dc7230a9a2e2febe18
3
  size 4734533160
tokenizer_config.json CHANGED
@@ -189,7 +189,7 @@
189
  "model_max_length": 16384,
190
  "pad_token": "<|end▁of▁sentence|>",
191
  "sp_model_kwargs": {},
192
- "tokenizer_class": "LlamaTokenizer",
193
  "unk_token": null,
194
  "use_default_system_prompt": false
195
  }
 
189
  "model_max_length": 16384,
190
  "pad_token": "<|end▁of▁sentence|>",
191
  "sp_model_kwargs": {},
192
+ "tokenizer_class": "LlamaTokenizerFast",
193
  "unk_token": null,
194
  "use_default_system_prompt": false
195
  }