NicoNico committed on
Commit
f79ec17
·
verified ·
1 Parent(s): 24bdd25

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +30 -0
  2. config.json +71 -0
  3. model-00001-of-00088.safetensors +3 -0
  4. model-00002-of-00088.safetensors +3 -0
  5. model-00003-of-00088.safetensors +3 -0
  6. model-00004-of-00088.safetensors +3 -0
  7. model-00005-of-00088.safetensors +3 -0
  8. model-00006-of-00088.safetensors +3 -0
  9. model-00007-of-00088.safetensors +3 -0
  10. model-00008-of-00088.safetensors +3 -0
  11. model-00009-of-00088.safetensors +3 -0
  12. model-00010-of-00088.safetensors +3 -0
  13. model-00011-of-00088.safetensors +3 -0
  14. model-00012-of-00088.safetensors +3 -0
  15. model-00013-of-00088.safetensors +3 -0
  16. model-00014-of-00088.safetensors +3 -0
  17. model-00015-of-00088.safetensors +3 -0
  18. model-00016-of-00088.safetensors +3 -0
  19. model-00017-of-00088.safetensors +3 -0
  20. model-00018-of-00088.safetensors +3 -0
  21. model-00019-of-00088.safetensors +3 -0
  22. model-00020-of-00088.safetensors +3 -0
  23. model-00021-of-00088.safetensors +3 -0
  24. model-00022-of-00088.safetensors +3 -0
  25. model-00023-of-00088.safetensors +3 -0
  26. model-00024-of-00088.safetensors +3 -0
  27. model-00025-of-00088.safetensors +3 -0
  28. model-00026-of-00088.safetensors +3 -0
  29. model-00027-of-00088.safetensors +3 -0
  30. model-00028-of-00088.safetensors +3 -0
  31. model-00029-of-00088.safetensors +3 -0
  32. model-00030-of-00088.safetensors +3 -0
  33. model-00031-of-00088.safetensors +3 -0
  34. model-00032-of-00088.safetensors +3 -0
  35. model-00033-of-00088.safetensors +3 -0
  36. model-00034-of-00088.safetensors +3 -0
  37. model-00035-of-00088.safetensors +3 -0
  38. model-00036-of-00088.safetensors +3 -0
  39. model-00037-of-00088.safetensors +3 -0
  40. model-00038-of-00088.safetensors +3 -0
  41. model-00039-of-00088.safetensors +3 -0
  42. model-00040-of-00088.safetensors +3 -0
  43. model-00041-of-00088.safetensors +3 -0
  44. model-00042-of-00088.safetensors +3 -0
  45. model-00043-of-00088.safetensors +3 -0
  46. model-00044-of-00088.safetensors +3 -0
  47. model-00045-of-00088.safetensors +3 -0
  48. model-00046-of-00088.safetensors +3 -0
  49. model-00047-of-00088.safetensors +3 -0
  50. model-00048-of-00088.safetensors +3 -0
README.md CHANGED
@@ -1,3 +1,33 @@
1
  ---
2
  license: apache-2.0
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
  license: apache-2.0
3
+ tags:
4
+ - mlx
5
+ base_model: GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0
6
  ---
7
+
8
+ # GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0-mlx
9
+
10
+ This quantized low-bit model [GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0-mlx](https://huggingface.co/GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0-mlx) was converted to MLX format from [`GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0`](https://huggingface.co/GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0) using gbx-lm version **0.4.0**.
11
+ Refer to the [original model card](https://huggingface.co/GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0) for more details on the model.
12
+
13
+ ## Use with mlx
14
+
15
+ ```bash
16
+ pip install gbx-lm
17
+ ```
18
+
19
+ ```python
20
+ from gbx_lm import load, generate
21
+
22
+ model, tokenizer = load("GreenBitAI/DeepSeek-V3-0324-671B-layer-mix-bpw-4.0-mlx")
23
+
24
+ prompt = "hello"
25
+
26
+ if tokenizer.chat_template is not None:
27
+     messages = [{"role": "user", "content": prompt}]
28
+     prompt = tokenizer.apply_chat_template(
29
+         messages, add_generation_prompt=True
30
+     )
31
+
32
+ response = generate(model, tokenizer, prompt=prompt, verbose=True)
33
+ ```
config.json ADDED
@@ -0,0 +1,71 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_deepseek.DeepseekV3Config",
9
+ "AutoModel": "modeling_deepseek.DeepseekV3Model",
10
+ "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
11
+ },
12
+ "bos_token_id": 0,
13
+ "eos_token_id": 1,
14
+ "ep_size": 1,
15
+ "first_k_dense_replace": 3,
16
+ "hidden_act": "silu",
17
+ "hidden_size": 7168,
18
+ "initializer_range": 0.02,
19
+ "intermediate_size": 18432,
20
+ "kv_lora_rank": 512,
21
+ "max_position_embeddings": 163840,
22
+ "model_type": "deepseek_v3",
23
+ "moe_intermediate_size": 2048,
24
+ "moe_layer_freq": 1,
25
+ "n_group": 8,
26
+ "n_routed_experts": 256,
27
+ "n_shared_experts": 1,
28
+ "norm_topk_prob": true,
29
+ "num_attention_heads": 128,
30
+ "num_experts_per_tok": 8,
31
+ "num_hidden_layers": 61,
32
+ "num_key_value_heads": 128,
33
+ "num_nextn_predict_layers": 1,
34
+ "q_lora_rank": 1536,
35
+ "qk_nope_head_dim": 128,
36
+ "qk_rope_head_dim": 64,
37
+ "quantization": {
38
+ "group_size": null,
39
+ "bits": null
40
+ },
41
+ "quantization_config": {
42
+ "activation_scheme": "dynamic",
43
+ "modules_to_not_convert": null,
44
+ "quant_method": "fp8",
45
+ "weight_block_size": [
46
+ 128,
47
+ 128
48
+ ]
49
+ },
50
+ "rms_norm_eps": 1e-06,
51
+ "rope_scaling": {
52
+ "beta_fast": 32,
53
+ "beta_slow": 1,
54
+ "factor": 40,
55
+ "mscale": 1.0,
56
+ "mscale_all_dim": 1.0,
57
+ "original_max_position_embeddings": 4096,
58
+ "type": "yarn"
59
+ },
60
+ "rope_theta": 10000,
61
+ "routed_scaling_factor": 2.5,
62
+ "scoring_func": "sigmoid",
63
+ "tie_word_embeddings": false,
64
+ "topk_group": 4,
65
+ "topk_method": "noaux_tc",
66
+ "torch_dtype": "float32",
67
+ "transformers_version": "4.49.0",
68
+ "use_cache": true,
69
+ "v_head_dim": 128,
70
+ "vocab_size": 129280
71
+ }
model-00001-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99dc41075ef08aaf07e96a3a811176c6c56b9dee121617ec59dc143f86194372
3
+ size 4880186243
model-00002-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6752417eaa8c3788a7bf99d9ca61374048ef73a6f835c6f8cc98a85f86e538ed
3
+ size 4119679627
model-00003-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3df79a615c5284b499d3150bbbc5345312a4fa23ccda20a23de9b18e66b31e1
3
+ size 3992978192
model-00004-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c4a1fc3ff2a04a8ea850ec4565290e259ea6e6d6b6942ac638df07935575205
3
+ size 4119679767
model-00005-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9728ad1722d371b8fbd4c1eeab2c161fc142dd975a3340628db3fdc1f37548
3
+ size 4119679673
model-00006-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e345c519991d928c368e29757e5408d963016557b33ace0eea45df3fac5a7f7f
3
+ size 3992978186
model-00007-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94f083381e8fbbee796599e1ae4b7965850ead256289c6d96eb57002d6be89f9
3
+ size 4119679725
model-00008-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0619a764be657cdab66bcf4faa6a31702e58b51922948e9ca8c342715801aa5d
3
+ size 4119679679
model-00009-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09fe7583a9a6c8a85b5bcbf35cef148a8b3ad0b91527843bef869db828232e71
3
+ size 3992978190
model-00010-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a561f8627974b875aaac37911c6e3a03cd375744f15a2cf9d03a33a9e14bc93
3
+ size 4119679761
model-00011-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b93f1d2041239981a11931ed1d5b80fe33d465683a3d57d1184d786333c4b232
3
+ size 4119679676
model-00012-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0127de0dba15c00f4667f9265735e5b47689b3404566374ceff985fdf3b15167
3
+ size 3992978196
model-00013-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e78d55b2fb20c5f9ed87f0e87eed28c72b9e971eb0dab4f3d2fc3174e875b1d
3
+ size 4119679815
model-00014-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0e791a545d4f271828631b60fb0b188762d2394ffa292ea436c09e1566f95c1
3
+ size 4119679653
model-00015-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc45a3e5731e2b743e4168f0a09e032ac935d40cfff8965b8422d2c30974cc28
3
+ size 3992978196
model-00016-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1bcaff4801b469089e1a079d27389a50832bb4777f1ae05680d09860dbb07dd
3
+ size 4119679715
model-00017-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:326ce3009cf3c1746cf848b15a62a7fdd86429cc17342035990567f0ac0909b5
3
+ size 4119679725
model-00018-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc94dec8a6f6c230c4023fe997df743cdb06f87aeb46278c7f595a7f3f691995
3
+ size 3992978196
model-00019-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eda172a4d2091e5d3ffe256223e213f90b56f8bcdcf4630a741dff00aa32cb4d
3
+ size 4119679751
model-00020-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c893cd7e44fe154a7ea3c478170b97861f78cec888a98f9499c9d3a55ac43f8
3
+ size 4119679697
model-00021-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9d7b74600678fe2df64ae9447d406edaf59232df79ff531741bb9d28675c985
3
+ size 3992978198
model-00022-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16fc8d0653fbbaabf42b9d3c049cdab488797d3b9027ccd8edaf1ad82ad33422
3
+ size 4119679815
model-00023-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2408c5afa448f6d524024ac742b47b8c700bdf75e4dd1ab8f84614e349b117c3
3
+ size 4119679721
model-00024-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b3ea1ce3267de8d5ac86a2c8b4a0ab3398219ac756cb15bed2252ef10225755
3
+ size 3992978196
model-00025-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6888240d3416ef36e929afcdf63214e8fad35270e9383c67fa74478f01940c76
3
+ size 4119679809
model-00026-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5336771339154ecba1b993f7993c32635927f9cca44386e5b38424d9e89fe49c
3
+ size 4119679719
model-00027-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:517089f4508bda187facf1d359cfb256b3bf64dc20f6fd0c5caaf2f1f36bc3d8
3
+ size 3992978196
model-00028-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86d808e0a8941b9ae622b8852659b151a005b898b1485a95754895a7717abbbd
3
+ size 4119679819
model-00029-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9b0f9e443b42be5260c04533eb0115426a5909b33c284572838ed5f7d0918f6
3
+ size 4119679679
model-00030-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c3f93a8f828f213fa0c098c4fe6c36dd6e992c73388be0df3b11f95bb4fbe08
3
+ size 3992978198
model-00031-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12b0b32fd09c2e27d5f970fb0f4da9adc34794401fc7c8f4c7f91a7a9ed7db8d
3
+ size 4119679815
model-00032-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1a0e89b82fe7557c3af0bb0c0112c9289d3b7853b988032aa3744fbb1e96bd3
3
+ size 4119679731
model-00033-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:198a942c4b5aecb05518c1e7f7f59af5dea0a9d881f66c16b9eb1509732a4da8
3
+ size 3992978194
model-00034-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:980c6444ad2cde624aa0477bffd8fc34b55682ffe53eba59b392ed8ba1bbc5b1
3
+ size 4119679819
model-00035-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc9e44bfc5583a99127563358477a49ef8ae1b0c04298deb39dbcbcbdc1fa78f
3
+ size 4119679725
model-00036-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ec16406d89a771929c2bfe831cd4005af8fb011969a82fef9e39b3d3ade1541
3
+ size 3992978198
model-00037-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d60a14d7d33ff07ad5f0a688e429fd45b64d7105bc4b9bbd64b6fafb627a41aa
3
+ size 4119679785
model-00038-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfa00afae5f3191f5e118647fbcfee4f0f4623551b2029e5e4c561e7ee5eb518
3
+ size 4119679679
model-00039-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e8082e8e368bd2acbabf88b551bdea0b8190f44d82c6a9ba1190a462752ede7
3
+ size 3992978194
model-00040-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:829e30d3bee93bb84f4e4ef2af45a9af1298b89c0ee0330a98d96dda348b4310
3
+ size 4119679815
model-00041-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e9cf318a1d47c5df308557bcd2c8bef37158b4eeb00e05fa0dcf45f86dc5052
3
+ size 4119679735
model-00042-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:730e800e041809759727b69e216b66bc08242d476c40538637fa80701bb6d6a3
3
+ size 3992978198
model-00043-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e449cdbf359a3042028ff9cf54599f5392b364e8ba162c70e052c664a3ecb88
3
+ size 4119679813
model-00044-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4481d4dc7dd7f9da7e85daca474d4dd45f0048cd82551c1e80f6d1b64f96d990
3
+ size 4119679703
model-00045-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a65fbf007cdc8b01504546d9a3fd9aeb4ec7a7650da618dced166673ce2bac4d
3
+ size 3992978194
model-00046-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cb963a60e9cda2b641d32e03ea02c2eb32cb9fd42006683ad9037596507ed28
3
+ size 4119679813
model-00047-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b83700c48976a893d400280de5f8bd39b311dcee5e632c8bd5fa1b2dd3632c5
3
+ size 4119679699
model-00048-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e16c2ebdec9413a9194a7eb58c7291dfc86f76d6a1307d26065cd10b22b1a70
3
+ size 3992978198