Snowflake
/

Arctic-LSTM-Speculator-Llama-3.3-70B-Instruct

jeffra commited on Apr 30

Commit

b9e8309

verified ·

1 Parent(s): d4e4797

Upload config.json with huggingface_hub

Files changed (1) hide show

config.json ADDED Viewed

+{
+  "architectures": [
+    "ArcticLSTMSpeculatorPreTrainedModel"
+  ],
+  "base_model_name_or_path": "meta-llama/Llama-3.3-70B-Instruct",
+  "input_hidden_dim": 8192,
+  "inner_dim": "6144",
+  "proj_dim": "6144",
+  "emb_dim": "6144",
+  "model_type": "mlp_speculator",
+  "n_candidates": 3,
+  "n_predict": 3,
+  "scale_input": true,
+  "tie_weights": true,
+  "tie_lstm_embs": true,
+  "top_k_tokens_per_head": [
+    1,
+    1,
+    1
+  ],
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "vocab_size": 128256,
+  "method": "sum_lstm"
+}