jeffra's picture
Upload config.json with huggingface_hub
b9e8309 verified
{
  "architectures": [
    "ArcticLSTMSpeculatorPreTrainedModel"
  ],
  "base_model_name_or_path": "meta-llama/Llama-3.3-70B-Instruct",
  "input_hidden_dim": 8192,
  "inner_dim": "6144",
  "proj_dim": "6144",
  "emb_dim": "6144",
  "model_type": "mlp_speculator",
  "n_candidates": 3,
  "n_predict": 3,
  "scale_input": true,
  "tie_weights": true,
  "tie_lstm_embs": true,
  "top_k_tokens_per_head": [
    1,
    1,
    1
  ],
  "torch_dtype": "bfloat16",
  "transformers_version": "4.47.0",
  "vocab_size": 128256,
  "method": "sum_lstm"
}