michaelbenayoun HF Staff committed on
Commit
6f4bcbe
·
verified ·
1 Parent(s): 3592608

Upload DeepseekV3ForCausalLM

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. model.safetensors +2 -2
config.json CHANGED
@@ -35,7 +35,7 @@
35
  "num_nextn_predict_layers": 0,
36
  "pretraining_tp": 1,
37
  "q_lora_rank": 48,
38
- "qk_head_dim": 48,
39
  "qk_nope_head_dim": 32,
40
  "qk_rope_head_dim": 32,
41
  "quantization_config": {
 
35
  "num_nextn_predict_layers": 0,
36
  "pretraining_tp": 1,
37
  "q_lora_rank": 48,
38
+ "qk_head_dim": 64,
39
  "qk_nope_head_dim": 32,
40
  "qk_rope_head_dim": 32,
41
  "quantization_config": {
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1df2c380c0a617c83807445c3a2779128ba1677f2b8e2d9a794164cb4eacd1a2
3
- size 115530536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc77d5fa0f43af6e87ad6c1696b4463d169316adce893db57ae731bc268557ca
3
+ size 115727160