Update model
Browse files
- Luau-Devstral-24B-Instruct-v0.1-BF16.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-IQ1_M.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-IQ2_M.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-IQ3_M.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-IQ4_xs.gguf +3 -0
- Luau-Devstral-24B-Instruct-v0.1-Q3_K_M.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-Q4_K_M.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-Q5_K_M.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-Q6_K.gguf +2 -2
- Luau-Devstral-24B-Instruct-v0.1-Q8_0.gguf +2 -2
- README.md +27 -20
- config.json +2 -2
- generation_config.json +1 -1
- imatrix.gguf +2 -2
- model-00001-of-00010.safetensors +1 -1
- model-00002-of-00010.safetensors +1 -1
- model-00003-of-00010.safetensors +1 -1
- model-00004-of-00010.safetensors +1 -1
- model-00005-of-00010.safetensors +1 -1
- model-00006-of-00010.safetensors +1 -1
- model-00007-of-00010.safetensors +1 -1
- model-00008-of-00010.safetensors +1 -1
- model-00009-of-00010.safetensors +1 -1
- model-00010-of-00010.safetensors +1 -1
- model.safetensors.index.json +1 -1
- tokenizer_config.json +1 -1
Luau-Devstral-24B-Instruct-v0.1-BF16.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f57afbcf52d437a7c3f896254f7ed6032f19878d462c5a968adc1acab171e1a9
|
3 |
+
size 47153529600
|
Luau-Devstral-24B-Instruct-v0.1-IQ1_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ba104c7049f27ecc91a76531c1a3dc782ee591101f9aab363a094fdc809e7be
|
3 |
+
size 5750506496
|
Luau-Devstral-24B-Instruct-v0.1-IQ2_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9f7fac543dd425a96f06488f4a7b511208ef201ac6e500af718dd6628074008
|
3 |
+
size 8114062336
|
Luau-Devstral-24B-Instruct-v0.1-IQ3_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e5a09df7f661b58b9ee93d9dbbd377c184ee208d99224b0a0442affa6790da2
|
3 |
+
size 10650960896
|
Luau-Devstral-24B-Instruct-v0.1-IQ4_xs.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e671eb18e1592333f1fac3703645eb91445f098d05ebd410a200506b44919d48
|
3 |
+
size 12758926336
|
Luau-Devstral-24B-Instruct-v0.1-Q3_K_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b5a44e23750727217bd6ce982c67374b75af5720acb892b108bc5883146c987
|
3 |
+
size 11474093056
|
Luau-Devstral-24B-Instruct-v0.1-Q4_K_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f430a622277f25ecb40a3d144e5aec2769bebdc831bd46a9cfcae7c217424992
|
3 |
+
size 14333920256
|
Luau-Devstral-24B-Instruct-v0.1-Q5_K_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:113f1f3b6609bd3ce2acf93255740dede0a194cb6e0d3dc2fe18d25442fd8e96
|
3 |
+
size 16763995136
|
Luau-Devstral-24B-Instruct-v0.1-Q6_K.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e951fbff41020f3fd150648d676e9074e022190904ff1a1d93414a38793eb22
|
3 |
+
size 19345949696
|
Luau-Devstral-24B-Instruct-v0.1-Q8_0.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a390a16f77f62e33c70b654f92ffca90d7e0c763cda9a1aad00f96c1f8ab03d2
|
3 |
+
size 25054790656
|
README.md
CHANGED
@@ -11,7 +11,7 @@ language:
|
|
11 |
- pt
|
12 |
- it
|
13 |
base_model:
|
14 |
-
- unsloth/Devstral-Small-2507
|
15 |
tags:
|
16 |
- roblox
|
17 |
- luau
|
@@ -35,7 +35,7 @@ Devstral Small 2507 is a powerful choice for local inference, achieving SOTA ope
|
|
35 |
- **Developed by:** Zack Williams ([boatbomber](https://huggingface.co/boatbomber))
|
36 |
- **Funded by:** [Torpedo Software LLC](https://huggingface.co/TorpedoSoftware)
|
37 |
- **License:** [Apache 2.0](https://www.tldrlegal.com/license/apache-license-2-0-apache-2-0)
|
38 |
-
- **Finetuned from model:** [unsloth/Devstral-Small-2507
|
39 |
|
40 |
### Model Sources
|
41 |
|
@@ -48,22 +48,31 @@ Devstral Small 2507 is a powerful choice for local inference, achieving SOTA ope
|
|
48 |
### Training Data
|
49 |
|
50 |
1. https://huggingface.co/datasets/TorpedoSoftware/the-luau-stack
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
51 |
2. https://huggingface.co/datasets/TorpedoSoftware/roblox-info-dump
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
52 |
|
53 |
-
|
54 |
|
55 |
-
|
56 |
-
|
57 |
-
```md
|
58 |
-
Repository: {repo_name}
|
59 |
-
Repository Description: {repo_description}
|
60 |
-
|
61 |
-
File Path: `{file_path}`
|
62 |
-
File Content:
|
63 |
-
```Lua
|
64 |
-
{file_content}
|
65 |
-
```\
|
66 |
-
```
|
67 |
|
68 |
### Training Loss Curve
|
69 |
|
@@ -71,14 +80,12 @@ File Content:
|
|
71 |
|
72 |
### Imatrix Calibration
|
73 |
|
74 |
-
The imatrix for the GGUF quantizations was computed using
|
75 |
|
76 |
## Environmental Impact
|
77 |
|
78 |
Carbon emissions estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
|
79 |
|
80 |
-
- **Hardware Type:**
|
81 |
- **Hours used:** 60
|
82 |
-
- **
|
83 |
-
- **Compute Region:** Bay Area
|
84 |
-
- **Carbon Emitted:** 4.73 kg CO2eq (equivalent to 11.8 miles driven by an average ICE car)
|
|
|
11 |
- pt
|
12 |
- it
|
13 |
base_model:
|
14 |
+
- unsloth/Devstral-Small-2507
|
15 |
tags:
|
16 |
- roblox
|
17 |
- luau
|
|
|
35 |
- **Developed by:** Zack Williams ([boatbomber](https://huggingface.co/boatbomber))
|
36 |
- **Funded by:** [Torpedo Software LLC](https://huggingface.co/TorpedoSoftware)
|
37 |
- **License:** [Apache 2.0](https://www.tldrlegal.com/license/apache-license-2-0-apache-2-0)
|
38 |
+
- **Finetuned from model:** [unsloth/Devstral-Small-2507](https://huggingface.co/unsloth/Devstral-Small-2507)
|
39 |
|
40 |
### Model Sources
|
41 |
|
|
|
48 |
### Training Data
|
49 |
|
50 |
1. https://huggingface.co/datasets/TorpedoSoftware/the-luau-stack
|
51 |
+
|
52 |
+
Format:
|
53 |
+
```md
|
54 |
+
Repository: {repo_name}
|
55 |
+
Repository Description: {repo_description}
|
56 |
+
|
57 |
+
File Path: `{file_path}`
|
58 |
+
File Content:
|
59 |
+
```Lua
|
60 |
+
{file_content}
|
61 |
+
```\
|
62 |
+
```
|
63 |
2. https://huggingface.co/datasets/TorpedoSoftware/roblox-info-dump
|
64 |
+
|
65 |
+
Format:
|
66 |
+
```md
|
67 |
+
Roblox Creator Docs: {url}
|
68 |
+
```md
|
69 |
+
{content}
|
70 |
+
```\
|
71 |
+
```
|
72 |
|
73 |
+
### Training Process
|
74 |
|
75 |
+
Trained a LoRA adapter (r=64) at full precision on two epochs of the dataset for a total of 54,630 steps and 43.40 E FLOPs. Then merged the final adapter checkpoint into a BF16 model.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
76 |
|
77 |
### Training Loss Curve
|
78 |
|
|
|
80 |
|
81 |
### Imatrix Calibration
|
82 |
|
83 |
+
The imatrix for the GGUF quantizations was computed using 5.73 MB of text containing a combination of [technical.txt](https://huggingface.co/datasets/froggeric/imatrix/blob/main/technical.txt), [groups_merged.txt](https://huggingface.co/datasets/froggeric/imatrix/blob/main/groups_merged.txt), and content from [the-luau-stack](https://huggingface.co/datasets/TorpedoSoftware/the-luau-stack) & [roblox-info-dump](https://huggingface.co/datasets/TorpedoSoftware/roblox-info-dump). This created an imatrix that is well suited to the specialized tasks this model is designed for while still maintaining broader intelligence. While we do provide several quantizations already, the `imatrix.gguf` is included in this repository should you want to create other quants yourself.
|
84 |
|
85 |
## Environmental Impact
|
86 |
|
87 |
Carbon emissions estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
|
88 |
|
89 |
+
- **Hardware Type:** A100 80GB PCIe
|
90 |
- **Hours used:** 60
|
91 |
+
- **Carbon Emitted:** ~4.5 kg CO2eq (equivalent to ~10.1 miles driven by an average ICE car)
|
|
|
|
config.json
CHANGED
@@ -22,9 +22,9 @@
|
|
22 |
"sliding_window": null,
|
23 |
"tie_word_embeddings": false,
|
24 |
"torch_dtype": "bfloat16",
|
25 |
-
"transformers_version": "4.55.
|
26 |
"unsloth_fixed": true,
|
27 |
-
"unsloth_version": "2025.8.
|
28 |
"use_cache": true,
|
29 |
"vocab_size": 131072
|
30 |
}
|
|
|
22 |
"sliding_window": null,
|
23 |
"tie_word_embeddings": false,
|
24 |
"torch_dtype": "bfloat16",
|
25 |
+
"transformers_version": "4.55.3",
|
26 |
"unsloth_fixed": true,
|
27 |
+
"unsloth_version": "2025.8.9",
|
28 |
"use_cache": true,
|
29 |
"vocab_size": 131072
|
30 |
}
|
generation_config.json
CHANGED
@@ -4,5 +4,5 @@
|
|
4 |
"eos_token_id": 2,
|
5 |
"max_length": 131072,
|
6 |
"pad_token_id": 11,
|
7 |
-
"transformers_version": "4.55.
|
8 |
}
|
|
|
4 |
"eos_token_id": 2,
|
5 |
"max_length": 131072,
|
6 |
"pad_token_id": 11,
|
7 |
+
"transformers_version": "4.55.3"
|
8 |
}
|
imatrix.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43e84a154059602f576de657d723d7f35aeb929660ee8f78238388e5d64e3f84
|
3 |
+
size 10037344
|
model-00001-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781571736
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24e3d5e7f129926fbbc91099bc357ed8dad2d535c00935b747738b97b5bc602a
|
3 |
size 4781571736
|
model-00002-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781592784
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7659bd8dc9c015c6ed3cb6acfdbabe3195eb33aac6475ddc1a2d080b715eea78
|
3 |
size 4781592784
|
model-00003-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781592800
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da3d9b538cd7c9a689ca42819a935f2654f4e69dbbdb9ab27e8f264e1a504b81
|
3 |
size 4781592800
|
model-00004-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4886471600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71cd682ad99eb857404b24616bbaa9b9fc9741a62d1c4421ba6bcd5a9d55944b
|
3 |
size 4886471600
|
model-00005-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781592824
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c364dc773505c6eaa70ecde6f2c0a4fc8cade2921d978d8f1a3190a7121e3b45
|
3 |
size 4781592824
|
model-00006-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781592816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dda03a2c951066cc3b5d84bf939264fa94557ffb1a37da42cadeac3cc95f0eb0
|
3 |
size 4781592816
|
model-00007-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4886471600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc5527a3f6c7a736129e275e166ea054b327ac74fb16e891feabfd2088c1aea0
|
3 |
size 4886471600
|
model-00008-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781592824
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e24bbb48a307739507bef06531ede237884fbb4c0f9e3d5c33b72b9ba2edc22f
|
3 |
size 4781592824
|
model-00009-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4781592816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:735e74b7c38a12cd2d607514d50d5c8591c22fc88baa153396ba9c393562c060
|
3 |
size 4781592816
|
model-00010-of-00010.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3900777072
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a57790fb693007a0af0af4351dbc0a6367f25789d9422874f8d50cae1a487b0
|
3 |
size 3900777072
|
model.safetensors.index.json
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
-
"total_parameters":
|
4 |
"total_size": 47144806400
|
5 |
},
|
6 |
"weight_map": {
|
|
|
1 |
{
|
2 |
"metadata": {
|
3 |
+
"total_parameters": 23572403200,
|
4 |
"total_size": 47144806400
|
5 |
},
|
6 |
"weight_map": {
|
tokenizer_config.json
CHANGED
@@ -9013,7 +9013,7 @@
|
|
9013 |
"legacy": true,
|
9014 |
"model_max_length": 131072,
|
9015 |
"pad_token": "<pad>",
|
9016 |
-
"padding_side": "
|
9017 |
"tokenizer_class": "LlamaTokenizerFast",
|
9018 |
"unk_token": "<unk>",
|
9019 |
"use_default_system_prompt": false
|
|
|
9013 |
"legacy": true,
|
9014 |
"model_max_length": 131072,
|
9015 |
"pad_token": "<pad>",
|
9016 |
+
"padding_side": "right",
|
9017 |
"tokenizer_class": "LlamaTokenizerFast",
|
9018 |
"unk_token": "<unk>",
|
9019 |
"use_default_system_prompt": false
|