NicoNico committed on
Commit
be59f39
·
verified ·
1 Parent(s): 2aeae00

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +34 -0
  2. config.json +74 -0
  3. model-00001-of-00088.safetensors +3 -0
  4. model-00002-of-00088.safetensors +3 -0
  5. model-00003-of-00088.safetensors +3 -0
  6. model-00004-of-00088.safetensors +3 -0
  7. model-00005-of-00088.safetensors +3 -0
  8. model-00006-of-00088.safetensors +3 -0
  9. model-00007-of-00088.safetensors +3 -0
  10. model-00008-of-00088.safetensors +3 -0
  11. model-00009-of-00088.safetensors +3 -0
  12. model-00010-of-00088.safetensors +3 -0
  13. model-00011-of-00088.safetensors +3 -0
  14. model-00012-of-00088.safetensors +3 -0
  15. model-00013-of-00088.safetensors +3 -0
  16. model-00014-of-00088.safetensors +3 -0
  17. model-00015-of-00088.safetensors +3 -0
  18. model-00016-of-00088.safetensors +3 -0
  19. model-00017-of-00088.safetensors +3 -0
  20. model-00018-of-00088.safetensors +3 -0
  21. model-00019-of-00088.safetensors +3 -0
  22. model-00020-of-00088.safetensors +3 -0
  23. model-00021-of-00088.safetensors +3 -0
  24. model-00022-of-00088.safetensors +3 -0
  25. model-00023-of-00088.safetensors +3 -0
  26. model-00024-of-00088.safetensors +3 -0
  27. model-00025-of-00088.safetensors +3 -0
  28. model-00026-of-00088.safetensors +3 -0
  29. model-00027-of-00088.safetensors +3 -0
  30. model-00028-of-00088.safetensors +3 -0
  31. model-00029-of-00088.safetensors +3 -0
  32. model-00030-of-00088.safetensors +3 -0
  33. model-00031-of-00088.safetensors +3 -0
  34. model-00032-of-00088.safetensors +3 -0
  35. model-00033-of-00088.safetensors +3 -0
  36. model-00034-of-00088.safetensors +3 -0
  37. model-00035-of-00088.safetensors +3 -0
  38. model-00036-of-00088.safetensors +3 -0
  39. model-00037-of-00088.safetensors +3 -0
  40. model-00038-of-00088.safetensors +3 -0
  41. model-00039-of-00088.safetensors +3 -0
  42. model-00040-of-00088.safetensors +3 -0
  43. model-00041-of-00088.safetensors +3 -0
  44. model-00042-of-00088.safetensors +3 -0
  45. model-00043-of-00088.safetensors +3 -0
  46. model-00044-of-00088.safetensors +3 -0
  47. model-00045-of-00088.safetensors +3 -0
  48. model-00046-of-00088.safetensors +3 -0
  49. model-00047-of-00088.safetensors +3 -0
  50. model-00048-of-00088.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - mlx
5
+ - mlx
6
+ base_model: GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0
7
+ ---
8
+
9
+ # GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0-mlx
10
+
11
+ This quantized low-bit model [GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0-mlx](https://huggingface.co/GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0-mlx) was converted to MLX format from [`GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0`](https://huggingface.co/GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0) using gbx-lm version **0.4.0**.
12
+ Refer to the [original model card](https://huggingface.co/GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0) for more details on the model.
13
+
14
+ ## Use with mlx
15
+
16
+ ```bash
17
+ pip install gbx-lm
18
+ ```
19
+
20
+ ```python
21
+ from gbx_lm import load, generate
22
+
23
+ model, tokenizer = load("GreenBitAI/DeepSeek-R1-671B-layer-mix-bpw-4.0-mlx")
24
+
25
+ prompt = "hello"
26
+
27
+ if tokenizer.chat_template is not None:
28
+     messages = [{"role": "user", "content": prompt}]
29
+     prompt = tokenizer.apply_chat_template(
30
+         messages, add_generation_prompt=True
31
+     )
32
+
33
+ response = generate(model, tokenizer, prompt=prompt, verbose=True)
34
+ ```
config.json ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_deepseek.DeepseekV3Config",
9
+ "AutoModel": "modeling_deepseek.DeepseekV3Model",
10
+ "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
11
+ },
12
+ "aux_loss_alpha": 0.001,
13
+ "bos_token_id": 0,
14
+ "eos_token_id": 1,
15
+ "ep_size": 1,
16
+ "first_k_dense_replace": 3,
17
+ "hidden_act": "silu",
18
+ "hidden_size": 7168,
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 18432,
21
+ "kv_lora_rank": 512,
22
+ "max_position_embeddings": 163840,
23
+ "model_type": "deepseek_v3",
24
+ "moe_intermediate_size": 2048,
25
+ "moe_layer_freq": 1,
26
+ "n_group": 8,
27
+ "n_routed_experts": 256,
28
+ "n_shared_experts": 1,
29
+ "norm_topk_prob": true,
30
+ "num_attention_heads": 128,
31
+ "num_experts_per_tok": 8,
32
+ "num_hidden_layers": 61,
33
+ "num_key_value_heads": 128,
34
+ "num_nextn_predict_layers": 1,
35
+ "pretraining_tp": 1,
36
+ "q_lora_rank": 1536,
37
+ "qk_nope_head_dim": 128,
38
+ "qk_rope_head_dim": 64,
39
+ "quantization": {
40
+ "group_size": null,
41
+ "bits": null
42
+ },
43
+ "quantization_config": {
44
+ "activation_scheme": "dynamic",
45
+ "modules_to_not_convert": null,
46
+ "quant_method": "fp8",
47
+ "weight_block_size": [
48
+ 128,
49
+ 128
50
+ ]
51
+ },
52
+ "rms_norm_eps": 1e-06,
53
+ "rope_scaling": {
54
+ "beta_fast": 32,
55
+ "beta_slow": 1,
56
+ "factor": 40,
57
+ "mscale": 1.0,
58
+ "mscale_all_dim": 1.0,
59
+ "original_max_position_embeddings": 4096,
60
+ "type": "yarn"
61
+ },
62
+ "rope_theta": 10000,
63
+ "routed_scaling_factor": 2.5,
64
+ "scoring_func": "sigmoid",
65
+ "seq_aux": true,
66
+ "tie_word_embeddings": false,
67
+ "topk_group": 4,
68
+ "topk_method": "noaux_tc",
69
+ "torch_dtype": "float32",
70
+ "transformers_version": "4.49.0",
71
+ "use_cache": true,
72
+ "v_head_dim": 128,
73
+ "vocab_size": 129280
74
+ }
model-00001-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dbeed36029b5765e4b6f7f8138f537753f4c603ef9ce909aed53ece6f750581
3
+ size 4880186214
model-00002-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49b713f9c751a06cb4718bae3c3a0d81ebd2f97dbb3a95debab5593daf617c3a
3
+ size 4119679619
model-00003-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b57ba81c6037672ca689f4c5ed0a098d897549f1c599f725087381f939c039a6
3
+ size 3992978192
model-00004-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f07709ba02fc398679ac8b2b1e8e572c5f844d2b167b8e127868c476af5684af
3
+ size 4119679759
model-00005-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bb8d0ddc6dbcbde0736b998a66eff8ddb9343167ec64b955e96cefc16be33bb
3
+ size 4119679665
model-00006-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd57e2837994f73f48d0c3aefe66dff46374c72cb8dc6b48a33801a751d1c3fd
3
+ size 3992978186
model-00007-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:044bc89b254bdb551d8aa40840ec75eb917ed32450d586bf0c8458e878d84fc3
3
+ size 4119679717
model-00008-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:963a64c86b26f49722a974b7886b5472a89c7a46a465d0ea2275bceb8af6a53f
3
+ size 4119679671
model-00009-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5352fb9adc3e04f4993b00af5e9f869dc3b890907dfe1533f9d042bd04e186d
3
+ size 3992978190
model-00010-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1c37389bb964969e3898c0f7529461198c285eee4ac0ed5ebed0a8c64041e90
3
+ size 4119679753
model-00011-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e38d02a2f9b57d405253f7c538002489c0bba71f15ed44043427609603369b80
3
+ size 4119679668
model-00012-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f8bc5d9d18bc48b94634593101a029a3e2785f55c23a31ff3c2f62033838c2
3
+ size 3992978196
model-00013-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f99ad69d3a838b54ad2bddeb1898c3d9ecb627e37d3b6ea4ba2f809a4124f28
3
+ size 4119679807
model-00014-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4898f9ca5e8b82420a02f69750afa1934e333fde653aee6c64d3248bf43635ca
3
+ size 4119679645
model-00015-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c9bdf13c1f4f831700f0773caf154726c0994deb4441b4e1f5ab571a1c50765
3
+ size 3992978196
model-00016-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:311187179b996d36df779ddfc8e6741e8d90c20dd5749dc6af183ddf33f841c3
3
+ size 4119679707
model-00017-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90ae81ffcf09006197839c513df9042e05769df81385c3f37a864da3101f427e
3
+ size 4119679717
model-00018-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40bedea2aae04b8561293ad3f2041b32ff3ba6af9afe7982ba1077d0f7a6357c
3
+ size 3992978196
model-00019-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a453a0956af30b9ad5176aceb984cd96b6b6289d27a06e0851b2376b7997c61
3
+ size 4119679743
model-00020-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:891e4246a9dccd8a6630b522c5e77dadfdbd6e52058c891d2c886565f91d40af
3
+ size 4119679689
model-00021-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:957ebec23489247e07d836c1aa4b1c32355e778099584117338e9d8374bd8b88
3
+ size 3992978198
model-00022-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f2cba763fe205d4bad16e12167e636dc76e45e8be97dab7a0bd5e877637eee8
3
+ size 4119679807
model-00023-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a95373052eab76adf90c753996f97ee487d3aab783048e3b7cc5ba3150b2e8c
3
+ size 4119679713
model-00024-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305b9d2d818dffbf696f595ee971451f28ec38bba59e9b8e9c0e71c79228d279
3
+ size 3992978196
model-00025-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c90fd6ba94a837f3950f6fad6ef6a91fda5021e4cf9c2432c75bd0f0b29ae9c
3
+ size 4119679801
model-00026-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc5df2aed401f370d5d948915dc9719867f27baeaeb1f9c26c6c0b9f8ddbd066
3
+ size 4119679711
model-00027-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce411b6f688d3c2fee499b8ef336cff42fb1971b354e4d2d1c94ea702450474
3
+ size 3992978196
model-00028-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78a86d597309be8d79b059b0dfc2d9aff314d99fd01d07fe09bcb1afdedc0ce7
3
+ size 4119679811
model-00029-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c421d0175e98b2a405f9a7dfe292ec9657c69cba64828b1edeea00196decc09
3
+ size 4119679671
model-00030-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b15865845ae0f8e14dd899be167b44411328d734468440b4eb6cc18f985723c5
3
+ size 3992978198
model-00031-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edc4ac903953b8b36d4760867378406c02b454e15d6f9e0dbceb5594355c82ab
3
+ size 4119679807
model-00032-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:937fc4225e5779ac471e069dae193ddcf88a691382bff60cd77f7f64b61a8e42
3
+ size 4119679723
model-00033-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0b307ca6138828523731464bff64c67a41a7c36a48e4cb7ba17d22de3a14d03
3
+ size 3992978194
model-00034-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af408148c48db1ebb78863de26b12d811c08aeb05e9142744752237d109e1f83
3
+ size 4119679811
model-00035-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:136e973c031799c3033185a2a480da9aacaf5583e509682e636f1068e8f04835
3
+ size 4119679717
model-00036-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c324f8936e6087afaebe075afef9f37723d0621bfda81bd616b4149602412007
3
+ size 3992978198
model-00037-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dc1f3ba4659a4ed7269ee8c8a3b1f17d038747e54052d5ef576f8591b01e371
3
+ size 4119679777
model-00038-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd781caa31559fe0147f7046ff9424585c52613dc91c793aace219cca164a5a8
3
+ size 4119679671
model-00039-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:359370d61f9bca694f2d999af75490442fdb610c2fa3f83db83ba9d12ce61fea
3
+ size 3992978194
model-00040-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c6bf57498b3b98d348eabbc719668ac8e400641542e8a4847ede81b82ecb678
3
+ size 4119679807
model-00041-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab16389e1ab9008c100a9126ac8ff53f84dc75492bcaca9bddeff96840534832
3
+ size 4119679727
model-00042-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b381c2cc314240b3c30e07ca56dd2657a7ae14a1d63ef701705fcda82157a225
3
+ size 3992978198
model-00043-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5ef2319353f87b16a8b3d8daeff49ebee97e585f8658b713f13dc09686ad48
3
+ size 4119679805
model-00044-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ac7fefcf567741f6917d69704c5522bc62b31763022a25ee04a561921ffae22
3
+ size 4119679695
model-00045-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20c7309f4f090ae89bf06ad2224d4ecdd99189e6c7312b1cc135969d2eedd8eb
3
+ size 3992978194
model-00046-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56794d664272a064b08c26b5c62fab35316a098f8962f3ed19179f2ab2e5ceb5
3
+ size 4119679805
model-00047-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c194c9612e7148cffffb4fe746154db7aa37869e43d90813c4d63a2bce34951
3
+ size 4119679691
model-00048-of-00088.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f03d9401cf1492ec19ccbb19c8e44a6725eb2ebe580f02e63188220956692833
3
+ size 3992978198