Jeethu committed on
Commit
14b9c8a
·
1 Parent(s): 012b11d

Add weights

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
README.md CHANGED
@@ -1,3 +1,13 @@
1
  ---
2
  license: mit
 
 
 
 
 
 
 
 
3
  ---
 
 
 
1
  ---
2
  license: mit
3
+ language:
4
+ - en
5
+ base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
6
+ base_model_relation: quantized
7
+ library_name: mlc-llm
8
+ pipeline_tag: text-generation
9
+ tags:
10
+ - chat
11
  ---
12
+
13
+ 4-bit GPTQ quantized version of [DeepSeek-R1-Distill-Qwen-7B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B).
mlc-chat-config.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen2",
4
+ "quantization": "GPTQ-Int4",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 3584,
8
+ "intermediate_size": 18944,
9
+ "num_attention_heads": 28,
10
+ "num_hidden_layers": 28,
11
+ "num_key_value_heads": 4,
12
+ "rms_norm_eps": 1e-06,
13
+ "rope_theta": 10000,
14
+ "vocab_size": 152064,
15
+ "tie_word_embeddings": false,
16
+ "context_window_size": 8192,
17
+ "prefill_chunk_size": 128,
18
+ "tensor_parallel_shards": 1,
19
+ "head_dim": 128,
20
+ "dtype": "float32",
21
+ "max_batch_size": 128
22
+ },
23
+ "vocab_size": 152064,
24
+ "context_window_size": 8192,
25
+ "sliding_window_size": -1,
26
+ "prefill_chunk_size": 128,
27
+ "attention_sink_size": -1,
28
+ "tensor_parallel_shards": 1,
29
+ "pipeline_parallel_stages": 1,
30
+ "temperature": 1.0,
31
+ "presence_penalty": 0.0,
32
+ "frequency_penalty": 0.0,
33
+ "repetition_penalty": 1.0,
34
+ "top_p": 1.0,
35
+ "tokenizer_files": [
36
+ "tokenizer.json",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_level",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "deepseek_r1_qwen",
46
+ "system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
47
+ "system_message": "You are a helpful assistant.",
48
+ "system_prefix_token_ids": null,
49
+ "add_role_after_system_message": true,
50
+ "roles": {
51
+ "user": "<\uff5cUser\uff5c>",
52
+ "assistant": "<\uff5cAssistant\uff5c>"
53
+ },
54
+ "role_templates": {
55
+ "user": "{user_message}",
56
+ "assistant": "{assistant_message}",
57
+ "tool": "{tool_message}"
58
+ },
59
+ "messages": [],
60
+ "seps": [
61
+ "",
62
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
63
+ ],
64
+ "role_content_sep": "",
65
+ "role_empty_sep": "",
66
+ "stop_str": [],
67
+ "stop_token_ids": [
68
+ 151643
69
+ ],
70
+ "function_string": "",
71
+ "use_function_calling": false
72
+ },
73
+ "pad_token_id": 0,
74
+ "bos_token_id": 151643,
75
+ "eos_token_id": 151643
76
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b617f133c27a1726b6c1ce1cac7176fcc83c6aedd967412bc38b83daa8e0915f
3
+ size 272498688
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1db881b8655fb06fc44a638ac9f6dd450a62fff48528828a69dd45a870932247
3
+ size 67895296
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df26afe2eb1a1d73ffd3626844cb3e8d59f289209d3a07467ce855fdd4eb0831
3
+ size 33947648
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae11f8114c132921e093c6a5ec5604237ecd495ee5319b2258d71daa75673df8
3
+ size 30066688
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d0db054ecf16a4370608ea4f11f3c9d287d92921b1b3eaa435b63befdc9c992
3
+ size 67895296
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3155f44e590254bf404be7de1072baf9662e0934084949d6ada04fa93a9ea3cc
3
+ size 33947648
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc82a1845a8ff345ecb266bb49080b336cac4046c4b212493bca472e28e9cf85
3
+ size 67895296
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5165b7c8096d0bca4d6bcafca95d0b9fa5724b62320b73014e19234f2f86054f
3
+ size 33947648
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:518c5a92a535dac36ea0b5b4c3533e2198ff34200b33071ea6b215f545673ea8
3
+ size 28174336
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8738d3872a9d8d654bd3c5907ecbb00a573236499267519f1bd022f1645cfa2a
3
+ size 67895296
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7102f1eb50167ec7b28af9fbe833fcc76ac38c01cea8601bab952ebecaf302e
3
+ size 33947648
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a073d31d44413fbbe23588a64585289f7fe5cbc45e1eb4663bd10abd3b3342b6
3
+ size 67895296
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b901fe53a32802ec9a3361f2619c07668a65251d9aff7881385e6b521852aca8
3
+ size 33947648
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55edefea1050e3ac3f923f4595ef5d4c59542a0f976c443edc384f1d74a803ac
3
+ size 33483776
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f205a70b6f87605b65cf396714951af8a265f5af7d7cbc353d2d18d6240529c
3
+ size 33947648
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b8de19753a24ceb520f198d2a1e638f9cb4ccc9e306a2e94debe19242f38da9
3
+ size 67895296
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a7fb8603344135dfeee0f9aa776845664f9d99303a3ccdecc40ccc8484c5fe3
3
+ size 33947648
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f8cf1554b850dc8ad5abb2ba8affc71dd5fbb4a003161ee18dc8a882f57612f
3
+ size 30066688
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29bc07af8532c4f36bc459558b449f7e616728541bf4b439424e4d3e58d9ffa0
3
+ size 67895296
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2a1ccb1c5f25050bdffe3a029b9c238cc647ac02fca4216a9aa3ba16cf4e0d2
3
+ size 33947648
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:354cddf723aaf7406529444a8d9884c595be0b585258a61f9ba0490712cec809
3
+ size 67895296
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3941e449eac9c2820b89b1a0e76d3f60097cdbe1d5bc91a55e9a0317c2bcba
3
+ size 33947648
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:734dd2e9dbb89fd3bb5bec277ba6f472cb0811b8049ed421ce89a76eaec83682
3
+ size 28174336
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dbb1dc1bc81e9bdd2e4ac023c79c26052fc33998ceb1aa35b37bd0d71ccc2c7
3
+ size 26869760
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5843300eac1810ce4a8b1edac353777df72fb323d29fb768d165d1f7f475c6b3
3
+ size 67895296
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ae90d396e202eacf69e04b22af6e3ec2556cbb3e91d36cc7bac25ecf2e0593e
3
+ size 33947648
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9fb95b0b63e11de8121db66d1d0655da2df41d65d3f595aab28282f1e4d0068
3
+ size 67895296
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d0a062fe33b3e974dc1e93a20ac33cbf41c32eae17b6c5f33e495c5b4e7bc2f
3
+ size 33483776
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc395fbd9695226a52a06cb305dd41dcaa78f2ea2c7b9d286f544c66d26f8ec3
3
+ size 33947648
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7e750ddcccafc47f7867d5fe33753a89c1ce66c95aa2b89d52534ef7d81f5cf
3
+ size 67895296
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b1cfad9b201ddaaf216624937cb0c56eb7747f3394a871a61d044299e3edc2e
3
+ size 33947648
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31cdcf18c86065eda444d54d0f7eba207a9510bae9498dbfa181054f7183fb58
3
+ size 30066688
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:422fb44dc280d47020cad1fd70ed16891421c7fa39dc652742295d529df73a12
3
+ size 67895296
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:533a8b24cebc7c420c030791010909c420e4624426989eb1c1db0da49cab5548
3
+ size 33947648
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05652421ae69a7bcb303e398beff11d7c288a899009d02b64e506a8fe26542c5
3
+ size 67895296
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dbf02c152fb77841b743c58f336765c5c61a56eeec04f111d42d40c099f16f5
3
+ size 67895296
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebfbb94555d84328f86e75a1e0e9046aee54aebc61b5325d400dbc428c32b0a1
3
+ size 33947648
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f1a45b7ad0844843bfc36f47de172200a0b26e9dad180a35ff9710752a3bbb0
3
+ size 28174336
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b797f0db2ca30f2d4d0a239cffd4457a35f55db7607d48547c94915962c202d9
3
+ size 67895296
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ac3104425e7c1112a56dd44e96b4e8d3158233b8c26523efbde206d08855497
3
+ size 33947648
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be31ddafbd7954b737ad6a8d42dc1209878967a89f6b3c6e7db165eaeda9f969
3
+ size 67895296
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d2b006506d0a0156ca274c89028b0a0e6c906961101aa7488e97c3ed5b45e24
3
+ size 33483776
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ed68bcf655ce74065a769e912f60a2c54c33a288d4f6f0803e7c6c65265c010
3
+ size 33947648
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00bf9f10c0f1a9ad77ce7cc4281f871c91afd68d2328e9c44acd491b7682fafb
3
+ size 67895296
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13327365f13d35b6ba43dc51a920a81a4b67e239c190ccad0e42e7223e0bb7ba
3
+ size 33947648
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cb57d58cafa4540296036277635120fb58bb91798fda1e766c372ab84d1dc59
3
+ size 33947648
params_shard_50.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e94f6c9a11143cea127a92b725ec1a6e042a62ece77a0995eaf7bc09aa6d7c1d
3
+ size 30066688