crumb committed on
Commit
a7e6f49
1 Parent(s): 6af521f

Upload model

Browse files
Files changed (2) hide show
  1. config.json +4 -3
  2. model.safetensors +1 -1
config.json CHANGED
@@ -1,11 +1,12 @@
1
  {
 
2
  "activation_function": "silu",
3
  "architectures": [
4
  "PlusModelForCausalLM"
5
  ],
6
  "auto_map": {
7
- "AutoConfig": "configuration_nano.NanoConfig",
8
- "AutoModelForCausalLM": "modeling_nano.PlusModelForCausalLM"
9
  },
10
  "bos_token_id": 1,
11
  "combined_qkv": true,
@@ -34,6 +35,6 @@
34
  "torch_dtype": "bfloat16",
35
  "transformers_version": "4.36.2",
36
  "use_bias": false,
37
- "use_cache": true,
38
  "vocab_size": 32000
39
  }
 
1
  {
2
+ "_name_or_path": "crumb/parallama-p8192-base-init",
3
  "activation_function": "silu",
4
  "architectures": [
5
  "PlusModelForCausalLM"
6
  ],
7
  "auto_map": {
8
+ "AutoConfig": "crumb/parallama-p8192-base-init--configuration_nano.NanoConfig",
9
+ "AutoModelForCausalLM": "crumb/parallama-p8192-base-init--modeling_nano.PlusModelForCausalLM"
10
  },
11
  "bos_token_id": 1,
12
  "combined_qkv": true,
 
35
  "torch_dtype": "bfloat16",
36
  "transformers_version": "4.36.2",
37
  "use_bias": false,
38
+ "use_cache": false,
39
  "vocab_size": 32000
40
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c5ca3f770208ce4f3cd1e358482ca79f38018aedb49a65f091b9794594f44bda
3
  size 738239160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5d823cecb0b6e9e1213e7bf618a81dd6637c7066d745073e1dc1c2f08956361
3
  size 738239160