jinliuxi committed on
Commit
4762455
·
verified ·
1 Parent(s): 22aa719

Upload DeepseekV3ForCausalLM

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. config.json +1 -6
  3. model.safetensors +1 -1
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- license: apache-2.0
3
  language:
4
  - zh
5
  - en
 
1
  ---
2
+ license: apache-2.0
3
  language:
4
  - zh
5
  - en
config.json CHANGED
@@ -1,13 +1,8 @@
1
  {
2
- "_name_or_path": "deepseekmini_2048",
3
  "architectures": [
4
  "DeepseekV3ForCausalLM"
5
  ],
6
- "auto_map": {
7
- "AutoConfig": "configuration_deepseek.DeepseekV3Config",
8
- "AutoModel": "modeling_deepseek.DeepseekV3Model",
9
- "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
10
- },
11
  "attention_bias": false,
12
  "attention_dropout": 0.0,
13
  "aux_loss_alpha": 0.001,
 
1
  {
2
+ "_name_or_path": "deepseekmini_highit/checkpoint-4961",
3
  "architectures": [
4
  "DeepseekV3ForCausalLM"
5
  ],
 
 
 
 
 
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "aux_loss_alpha": 0.001,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b13d34595071466d71f66c5fcaaa8f552f4609847ac6a2b9ceb3ccdc19c4328
3
  size 1341455152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98fc5b5efcdf56b90674b33dec996f4dd9b93220c5115caf9d10c0c2b4fc8060
3
  size 1341455152