Commit
·
2c5231c
1
Parent(s):
20af8c9
update
Browse files
- config.json +2 -2
- generation_config.json +1 -1
- hf_quant_config.json +5 -2
- model-00001-of-00015.safetensors +2 -2
- model-00002-of-00015.safetensors +2 -2
- model-00003-of-00015.safetensors +2 -2
- model-00004-of-00015.safetensors +2 -2
- model-00005-of-00015.safetensors +2 -2
- model-00006-of-00015.safetensors +2 -2
- model-00007-of-00015.safetensors +2 -2
- model-00008-of-00015.safetensors +2 -2
- model-00009-of-00015.safetensors +2 -2
- model-00010-of-00015.safetensors +2 -2
- model-00011-of-00015.safetensors +2 -2
- model-00012-of-00015.safetensors +2 -2
- model-00013-of-00015.safetensors +2 -2
- model-00014-of-00015.safetensors +2 -2
- model-00015-of-00015.safetensors +2 -2
- model.safetensors.index.json +0 -0
- special_tokens_map.json +0 -0
- tokenizer.json +0 -0
- tokenizer_config.json +1 -0
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "/opt/
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
@@ -33,7 +33,7 @@
|
|
33 |
"rope_theta": 500000.0,
|
34 |
"tie_word_embeddings": false,
|
35 |
"torch_dtype": "bfloat16",
|
36 |
-
"transformers_version": "4.
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 128256
|
39 |
}
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "/opt/zhiyu_hf_ckpts/Llama-3.1-70B-Instruct/",
|
3 |
"architectures": [
|
4 |
"LlamaForCausalLM"
|
5 |
],
|
|
|
33 |
"rope_theta": 500000.0,
|
34 |
"tie_word_embeddings": false,
|
35 |
"torch_dtype": "bfloat16",
|
36 |
+
"transformers_version": "4.44.0",
|
37 |
"use_cache": true,
|
38 |
"vocab_size": 128256
|
39 |
}
|
generation_config.json
CHANGED
@@ -8,5 +8,5 @@
|
|
8 |
],
|
9 |
"temperature": 0.6,
|
10 |
"top_p": 0.9,
|
11 |
-
"transformers_version": "4.
|
12 |
}
|
|
|
8 |
],
|
9 |
"temperature": 0.6,
|
10 |
"top_p": 0.9,
|
11 |
+
"transformers_version": "4.44.0"
|
12 |
}
|
hf_quant_config.json
CHANGED
@@ -1,10 +1,13 @@
|
|
1 |
{
|
2 |
"producer": {
|
3 |
"name": "modelopt",
|
4 |
-
"version": "0.
|
5 |
},
|
6 |
"quantization": {
|
7 |
"quant_algo": "FP8",
|
8 |
-
"kv_cache_quant_algo":
|
|
|
|
|
|
|
9 |
}
|
10 |
}
|
|
|
1 |
{
|
2 |
"producer": {
|
3 |
"name": "modelopt",
|
4 |
+
"version": "0.23.0"
|
5 |
},
|
6 |
"quantization": {
|
7 |
"quant_algo": "FP8",
|
8 |
+
"kv_cache_quant_algo": "FP8",
|
9 |
+
"exclude_modules": [
|
10 |
+
"lm_head"
|
11 |
+
]
|
12 |
}
|
13 |
}
|
model-00001-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c21fea9c05ad6e00434f3fb73d778d18bb594ac3a7a7bea1a978160227c881a5
|
3 |
+
size 4819363200
|
model-00002-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff18d0fe3c6233c256347080b18a41f8ab1a84ab2954d8d8492f5b1f1cb204a0
|
3 |
+
size 4983044160
|
model-00003-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e61982a1e76fcab453d8318ee1e63c3b8c68b979c86e6a3b0d737db0137a3fa
|
3 |
+
size 4899126392
|
model-00004-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8443516c25f10fba4ea56ef1103bcd53544f8f7b1207476d70824912d5e2685
|
3 |
+
size 4899159416
|
model-00005-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5393156ffbbd9ad3b2a04be5392fd6107b1a734fd8434f2ff9fa989f90ca437
|
3 |
+
size 4899159408
|
model-00006-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a00c83e264c731d4923f7b24bc91f9a2b992472fd524ebde77d7113cdb7b20b
|
3 |
+
size 4983044296
|
model-00007-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf43539ab4ea597ef9759881678942bf8585087121496142eabd0d83cd6bd4f6
|
3 |
+
size 4899126416
|
model-00008-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a5f7e53270acc9d9e35469aa4eb9fe17e743779be0b8e1569ca45f17f6e391d
|
3 |
+
size 4899159416
|
model-00009-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63120d51e50173d75346ba6ef04844d824b5a28a9175dc9001348dff44406557
|
3 |
+
size 4899159408
|
model-00010-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9412ea51371da7a4b1478f347b8274ccadb42d5ca4e83a4af5296c346a862eb4
|
3 |
+
size 4983044296
|
model-00011-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f4f754147e4ad7ce436fb5443df6c0b7b36726495f340bcd133ed42dec4d1a9
|
3 |
+
size 4899126416
|
model-00012-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96ec8ec1cb4d4bfe9bf55870ec3d77b22a9a88ff0eeff428b6141f7907552edc
|
3 |
+
size 4899159416
|
model-00013-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4de8cbec0025d4b86f77060d1cef452a3316c6f61f6c7d3ece01654bd2ae41ce
|
3 |
+
size 4899159408
|
model-00014-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:047841a4f0e868ed1715617b8e35729945e45bc477d3a8f2ddfa479f070d3375
|
3 |
+
size 4983044296
|
model-00015-of-00015.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c430f7ce602a4e4ef70e94baed4b012837903565f7c09c3af40194896ef138a
|
3 |
+
size 3812709816
|
model.safetensors.index.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
CHANGED
File without changes
|
tokenizer.json
CHANGED
File without changes
|
tokenizer_config.json
CHANGED
@@ -2058,5 +2058,6 @@
|
|
2058 |
"attention_mask"
|
2059 |
],
|
2060 |
"model_max_length": 131072,
|
|
|
2061 |
"tokenizer_class": "PreTrainedTokenizerFast"
|
2062 |
}
|
|
|
2058 |
"attention_mask"
|
2059 |
],
|
2060 |
"model_max_length": 131072,
|
2061 |
+
"pad_token": "<|eot_id|>",
|
2062 |
"tokenizer_class": "PreTrainedTokenizerFast"
|
2063 |
}
|