Upload folder using huggingface_hub

#1
by awni - opened
This view is limited to 50 files because it contains too many changes.  See the raw diff here.
Files changed (50) hide show
  1. README.md +33 -0
  2. config.json +69 -0
  3. model-00001-of-00070.safetensors +3 -0
  4. model-00002-of-00070.safetensors +3 -0
  5. model-00003-of-00070.safetensors +3 -0
  6. model-00004-of-00070.safetensors +3 -0
  7. model-00005-of-00070.safetensors +3 -0
  8. model-00006-of-00070.safetensors +3 -0
  9. model-00007-of-00070.safetensors +3 -0
  10. model-00008-of-00070.safetensors +3 -0
  11. model-00009-of-00070.safetensors +3 -0
  12. model-00010-of-00070.safetensors +3 -0
  13. model-00011-of-00070.safetensors +3 -0
  14. model-00012-of-00070.safetensors +3 -0
  15. model-00013-of-00070.safetensors +3 -0
  16. model-00014-of-00070.safetensors +3 -0
  17. model-00015-of-00070.safetensors +3 -0
  18. model-00016-of-00070.safetensors +3 -0
  19. model-00017-of-00070.safetensors +3 -0
  20. model-00018-of-00070.safetensors +3 -0
  21. model-00019-of-00070.safetensors +3 -0
  22. model-00020-of-00070.safetensors +3 -0
  23. model-00021-of-00070.safetensors +3 -0
  24. model-00022-of-00070.safetensors +3 -0
  25. model-00023-of-00070.safetensors +3 -0
  26. model-00024-of-00070.safetensors +3 -0
  27. model-00025-of-00070.safetensors +3 -0
  28. model-00026-of-00070.safetensors +3 -0
  29. model-00027-of-00070.safetensors +3 -0
  30. model-00028-of-00070.safetensors +3 -0
  31. model-00029-of-00070.safetensors +3 -0
  32. model-00030-of-00070.safetensors +3 -0
  33. model-00031-of-00070.safetensors +3 -0
  34. model-00032-of-00070.safetensors +3 -0
  35. model-00033-of-00070.safetensors +3 -0
  36. model-00034-of-00070.safetensors +3 -0
  37. model-00035-of-00070.safetensors +3 -0
  38. model-00036-of-00070.safetensors +3 -0
  39. model-00037-of-00070.safetensors +3 -0
  40. model-00038-of-00070.safetensors +3 -0
  41. model-00039-of-00070.safetensors +3 -0
  42. model-00040-of-00070.safetensors +3 -0
  43. model-00041-of-00070.safetensors +3 -0
  44. model-00042-of-00070.safetensors +3 -0
  45. model-00043-of-00070.safetensors +3 -0
  46. model-00044-of-00070.safetensors +3 -0
  47. model-00045-of-00070.safetensors +3 -0
  48. model-00046-of-00070.safetensors +3 -0
  49. model-00047-of-00070.safetensors +3 -0
  50. model-00048-of-00070.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: deepseek-ai/DeepSeek-V3
3
+ tags:
4
+ - mlx
5
+ ---
6
+
7
+ # mlx-community/DeepSeek-V3-3bit
8
+
9
+ The model [mlx-community/DeepSeek-V3-3bit](https://huggingface.co/mlx-community/DeepSeek-V3-3bit) was
10
+ converted to MLX format from [deepseek-ai/DeepSeek-V3](https://huggingface.co/deepseek-ai/DeepSeek-V3)
11
+ using mlx-lm version **0.20.4**.
12
+
13
+ ## Use with mlx
14
+
15
+ ```bash
16
+ pip install mlx-lm
17
+ ```
18
+
19
+ ```python
20
+ from mlx_lm import load, generate
21
+
22
+ model, tokenizer = load("mlx-community/DeepSeek-V3-3bit")
23
+
24
+ prompt="hello"
25
+
26
+ if tokenizer.chat_template is not None:
27
+     messages = [{"role": "user", "content": prompt}]
28
+     prompt = tokenizer.apply_chat_template(
29
+         messages, add_generation_prompt=True
30
+     )
31
+
32
+ response = generate(model, tokenizer, prompt=prompt, verbose=True)
33
+ ```
config.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "DeepseekV3ForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "auto_map": {
8
+ "AutoConfig": "configuration_deepseek.DeepseekV3Config",
9
+ "AutoModel": "modeling_deepseek.DeepseekV3Model",
10
+ "AutoModelForCausalLM": "modeling_deepseek.DeepseekV3ForCausalLM"
11
+ },
12
+ "aux_loss_alpha": 0.001,
13
+ "bos_token_id": 0,
14
+ "eos_token_id": 1,
15
+ "ep_size": 1,
16
+ "first_k_dense_replace": 3,
17
+ "hidden_act": "silu",
18
+ "hidden_size": 7168,
19
+ "initializer_range": 0.02,
20
+ "intermediate_size": 18432,
21
+ "kv_lora_rank": 512,
22
+ "max_position_embeddings": 163840,
23
+ "model_type": "deepseek_v3",
24
+ "moe_intermediate_size": 2048,
25
+ "moe_layer_freq": 1,
26
+ "n_group": 8,
27
+ "n_routed_experts": 256,
28
+ "n_shared_experts": 1,
29
+ "norm_topk_prob": true,
30
+ "num_attention_heads": 128,
31
+ "num_experts_per_tok": 8,
32
+ "num_hidden_layers": 61,
33
+ "num_key_value_heads": 128,
34
+ "num_nextn_predict_layers": 1,
35
+ "pretraining_tp": 1,
36
+ "q_lora_rank": 1536,
37
+ "qk_nope_head_dim": 128,
38
+ "qk_rope_head_dim": 64,
39
+ "quantization": {
40
+ "group_size": 32,
41
+ "bits": 3
42
+ },
43
+ "quantization_config": {
44
+ "group_size": 32,
45
+ "bits": 3
46
+ },
47
+ "rms_norm_eps": 1e-06,
48
+ "rope_scaling": {
49
+ "beta_fast": 32,
50
+ "beta_slow": 1,
51
+ "factor": 40,
52
+ "mscale": 1.0,
53
+ "mscale_all_dim": 1.0,
54
+ "original_max_position_embeddings": 4096,
55
+ "type": "yarn"
56
+ },
57
+ "rope_theta": 10000,
58
+ "routed_scaling_factor": 2.5,
59
+ "scoring_func": "sigmoid",
60
+ "seq_aux": true,
61
+ "tie_word_embeddings": false,
62
+ "topk_group": 4,
63
+ "topk_method": "noaux_tc",
64
+ "torch_dtype": "bfloat16",
65
+ "transformers_version": "4.33.1",
66
+ "use_cache": true,
67
+ "v_head_dim": 128,
68
+ "vocab_size": 129280
69
+ }
model-00001-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afb2860e4c2935102ef7d365644a0ff6411a428eccd6a9b6a38ac896c7ecc473
3
+ size 5190304316
model-00002-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a66d7ddbc5d5ad690797b8ccf8469491c1bfdc7309657d77b153b9807b7a089c
3
+ size 5286663082
model-00003-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc7d53b08417bf7c1456c2e25cbb5cd7d407547e272f3519a444b855e28130d
3
+ size 4347139111
model-00004-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4a558066775a32b8cc05dfa0f434344b8bbbafa737f271dfacd69e3455d0278
3
+ size 5286663080
model-00005-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5367cfc81927ac1e6aaff424bfdf8e926beabb9388b1e8737d443113ac7ff90
3
+ size 4347139063
model-00006-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e065d85484d2a538f1b94b23ee50db14c516db50c63aabe287b5fe776678a7a
3
+ size 5167383441
model-00007-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:892e9696a8da843b8f87aa4e366024e302bbc543242a32c566f108cc9544f0df
3
+ size 4347139109
model-00008-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efa3ea7a726a6c384fb689c44e55a6c377cf1d67f0881075a211d35c98fc23cc
3
+ size 5286663084
model-00009-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2da378bbf9109596c41467324d4c6d23511578d6b90689a8da763662871ecef8
3
+ size 4347139131
model-00010-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7df3d0becbc0f510ba5f9104a54b14c2593ae30fa84922d40bd0e88e0c892d05
3
+ size 5286663069
model-00011-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:212bd4ef0e77344379daa070adaa61d185bd01e78ce34d9c3eadcebd84ece8d3
3
+ size 4347139059
model-00012-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c30fcd7049dd4ff4f60bb6dc85d3cd2297c982b07770461c5f457f63b580a7bf
3
+ size 5167383450
model-00013-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca6e6eb4ff0dd7af33738add770885758313c403178deb2738c9a56d1daa6052
3
+ size 4347139129
model-00014-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:872acb9a415022670daa38727339ec064b573a993bfa2135a1d23cb62b83cea9
3
+ size 5286663083
model-00015-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:322cb2f50c54fff8032ee1ab1b53a87003c0cfccbecb386a6323643d3d8559be
3
+ size 4347139117
model-00016-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a64bc6de9e6e129c8db0a3033f40ff9e5fc8cf980adb6173561e69d6744f5fa9
3
+ size 5286663117
model-00017-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8ec3e07905f195cfc88d17891ada1e9c4444f62e7e2a5c0161647247c47ef76
3
+ size 4347139073
model-00018-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b394b90fc071147bdbaa6a783d87c8f0d2c1f8f3a79ee3975b902f1b1395bf4e
3
+ size 5167383450
model-00019-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2a2067a88176c81f06acfa67a63cd009d7dc92be52587f3d27ae6b12c8597e4
3
+ size 4347139115
model-00020-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:677ceec554d19e8b5b5422dfe211ee1b19ccf78f140a02a60a08cec329fda1b2
3
+ size 5286663117
model-00021-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dff0376be64872bf5ed78d693f5a1ff7789302258f0d2a18f907843e2c99bb6
3
+ size 4347139147
model-00022-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54c696a72cc06275475a0a0f3242b4165dcffafeed8d0bb3e857ca6bd1441f2e
3
+ size 5286663043
model-00023-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31f14ce1352f87d8a66dce2489ceb4fadd980e50adbf3f1ac87e134189f23b84
3
+ size 4347139039
model-00024-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02d5a4967d7e61f1481eabdbf47e90de08df9b50ccbde4a5d8cc87876e052984
3
+ size 5167383446
model-00025-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbedb849b864cf856b9f3149a9ed36cc897b077460fd6c7dd4b6abe8bd2ef62e
3
+ size 4347139147
model-00026-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b4d1480d575ee349d3056d9be11329b123814fb2d6e73f7d357acf8e2f1f1ce
3
+ size 5286663083
model-00027-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef311bb78c316caab108641d1b051a58e7248b082e346df51719cca9f9ad5de4
3
+ size 4347139101
model-00028-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc4903da709dcb8d3cd5c7c3b23a1697d62ccf500f59bb6de91a6aaac75f2794
3
+ size 5286663033
model-00029-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59d225c461042599f3fef5877916bb1497f9e26c4971accce7bb79247b6f3968
3
+ size 4347139073
model-00030-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4dad871e14bb76eee46f4e16c8c5fac7fdf4bbd1e37accf038ccb1bf238577c
3
+ size 5167383450
model-00031-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7024b39396350fae79b657014777167ea8511efb53f9f7bd291d72ceec1f4dc6
3
+ size 4347139147
model-00032-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79ca73c96a2c249d3ecf978ff1929f74220b9e7708f80c474184e5a7bab53f95
3
+ size 5286663107
model-00033-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbf3a2920290ba9da5d077584ed5eb2d017fb3d40d48f18dd2928d5199cd9eb8
3
+ size 4347139149
model-00034-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:612f61d2b995472445735a62faad5924c4847e1c661a5b0eb28886c2b10a9162
3
+ size 5286663117
model-00035-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b72270a46ad113fb8733a668fae36f125b3c3a8d90b3da106b094e69e04c489
3
+ size 4347139091
model-00036-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:094e3dde25610c6e1ccd2db4e353df31b83f3e5ef05b088d5398943bdf215dc3
3
+ size 5167383448
model-00037-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac777081603bba6e8921240fd981d787203342b6c867337bfbace49afbafbd04
3
+ size 4347139141
model-00038-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09dcd8df74c4a98d977d8b6042ef000e132d21937a5df14da76053bda1e2de43
3
+ size 5286663113
model-00039-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19cbc7ae6fb4e085f612cfa1306cd50298edbaa2621e32bfe0d6993183368ca2
3
+ size 4347139109
model-00040-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87dad6f77dc836b6adb8569b10fee02ca0227431cbd136e799dc02335cad403c
3
+ size 5286663117
model-00041-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f053d99d2bad7139316a65fed313c97185d0fe3f6fbd86d5c2799f494c3f1a65
3
+ size 4347139053
model-00042-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79e5b1e144f4aa5330ea5e831ea3b84193f614abc7b65c260c6b0472717cff57
3
+ size 5167383450
model-00043-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b58b46a28440ab45e0c26e67b8d2148b988717736ab085b5f538cbfad033346b
3
+ size 4347139145
model-00044-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37868143896853edc8c8f59db5b9843164795e4b72288471fbd6360ae078ce64
3
+ size 5286663073
model-00045-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c2e27d1c9e9de0f63e2523bf607f84234573dc7d3bffa89443296cdd0565ef6
3
+ size 4347139107
model-00046-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe32640d73a8dbc102bf5b0bd62f63562c51f561fcebd807a977000e129af583
3
+ size 5286663117
model-00047-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63d08186b3108380fe44e022a2e2bd95a64a040d112b14102d9b621ac064f470
3
+ size 4347139081
model-00048-of-00070.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b27fde43ce79bafad98d13f67e85e60a54bccce4643ef11db9c8539bf7dc1b5
3
+ size 5167383450