bdambrosio committed on Apr 14, 2024

Commit

b8eb21f

verified ·

1 Parent(s): 7a96572

Upload 22 files

Browse files

Files changed (22) hide show

cal_data.safetensors +3 -0
config.json +42 -0
generation_config.json +6 -0
job_new.json +0 -0
measurement.json +0 -0
model.safetensors.index.json +0 -0
output-00001-of-00013.safetensors +3 -0
output-00002-of-00013.safetensors +3 -0
output-00003-of-00013.safetensors +3 -0
output-00004-of-00013.safetensors +3 -0
output-00005-of-00013.safetensors +3 -0
output-00006-of-00013.safetensors +3 -0
output-00007-of-00013.safetensors +3 -0
output-00008-of-00013.safetensors +3 -0
output-00009-of-00013.safetensors +3 -0
output-00010-of-00013.safetensors +3 -0
output-00011-of-00013.safetensors +3 -0
output-00012-of-00013.safetensors +3 -0
output-00013-of-00013.safetensors +3 -0
special_tokens_map.json +30 -0
tokenizer.model +3 -0
tokenizer_config.json +44 -0

cal_data.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5c8fcee03ec1cb4b23851a80d561afb8e533dfca7c009761537878c8441c62ab
+size 1884248

config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+    "_name_or_path": "mistral-community/Mixtral-8x22B-v0.1",
+    "architectures": [
+        "MixtralForCausalLM"
+    ],
+    "attention_dropout": 0.0,
+    "bos_token_id": 1,
+    "eos_token_id": 2,
+    "hidden_act": "silu",
+    "hidden_size": 6144,
+    "initializer_range": 0.02,
+    "intermediate_size": 16384,
+    "max_position_embeddings": 65536,
+    "model_type": "mixtral",
+    "num_attention_heads": 48,
+    "num_experts_per_tok": 2,
+    "num_hidden_layers": 56,
+    "num_key_value_heads": 8,
+    "num_local_experts": 8,
+    "output_router_logits": false,
+    "rms_norm_eps": 1e-05,
+    "rope_theta": 1000000,
+    "router_aux_loss_coef": 0.001,
+    "router_jitter_noise": 0.0,
+    "sliding_window": null,
+    "tie_word_embeddings": false,
+    "torch_dtype": "float16",
+    "transformers_version": "4.39.3",
+    "use_cache": true,
+    "vocab_size": 32000,
+    "quantization_config": {
+        "quant_method": "exl2",
+        "version": "0.0.18",
+        "bits": 6.0,
+        "head_bits": 8,
+        "calibration": {
+            "rows": 100,
+            "length": 2048,
+            "dataset": "(default)"
+        }
+    }
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "transformers_version": "4.39.3"
+}

job_new.json ADDED Viewed

The diff for this file is too large to render. See raw diff

measurement.json ADDED Viewed

The diff for this file is too large to render. See raw diff

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

output-00001-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:873ea7282e3b60ee45574951e880b6c917ec800a75cd18b5cba0213682ef576f
+size 8589598584

output-00002-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d8ce1c66a7274958c289793b03a2a2d284f3bd7d9ae1c3ac0fe8b9e5540181ac
+size 8577086984

output-00003-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68acd6a0cd399ff374202aca5997eb6cb0ac5c6a521f040910d031ed42ccc1dd
+size 8570430680

output-00004-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a7b6c06d4aa66436b1d27ea28748ab0e65f4ea827c2d7a35d587b5b2ba9eb14
+size 8589795448

output-00005-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a650d738e44ac884a220d6c502fb72b127d5b096e24388d4c92c09f5f05f3c8
+size 8567151080

output-00006-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c076d4cede8a9bca2eb10a472c9168280bf3a796e05ffae76ebc804431680672
+size 8585961736

output-00007-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e72ffa4358120f2f43b55ab73b1b81054a78a86a8d3ad229b7d318bd51a07fa
+size 8566364392

output-00008-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1d41dc53621408670e48e5d282c0a09f2257a8d8e2bdc66d5aba57a795985a7
+size 8566364392

output-00009-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6dcc67400b45743600a265438b423c0a1407eca76ba1a85b428594d274d2ee1b
+size 8574489768

output-00010-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6ef66a4822e38d2c8547665f78b1f69e9befea99ca6f83c1d45a84d6676f61ce
+size 8555353656

output-00011-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:09106da0f14a604725c34d09552eeba60a7a19e944b8c42be60fbd4856325379
+size 8556924912

output-00012-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf5524c43696fe326b1548cfada7be5747d5dcf093d51435659caa82556f886c
+size 8551482560

output-00013-of-00013.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d9dc2ade0688342b3ec80f42eee74b50840b4d32f8b11e6e649a4b2973c234c
+size 2913689928

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
+size 493443

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "add_prefix_space": true,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [],
+  "bos_token": "<s>",
+  "chat_template": "{%- set message_roles = ['USER', 'ASSISTANT'] -%}\n{%- set ns = namespace(initial_system_message_handled=false, messages=messages) -%}\n{{ bos_token }}\n{%- for message in ns.messages -%}\n  {%- if message['role'] | upper == 'SYSTEM' and not ns.initial_system_message_handled -%}\n    {%- set ns.initial_system_message_handled = true -%}\n    {{'SYSTEM: ' + message['content'] }}\n  {%- elif message['role'] | upper != 'SYSTEM' -%}\n    {%- if (message['role'] | upper == 'USER') != ((loop.index0 - (1 if ns.initial_system_message_handled else 0)) % 2 == 0) -%}\n      {{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}\n    {%- endif -%}\n    {%- if loop.index0 > 0 or ns.initial_system_message_handled -%}\n      {{ '\\n\\n' }}\n    {%- endif -%}\n    {%- if message['role'] | upper == 'USER' -%}\n      {{ 'USER: ' + message['content'] }}\n    {%- elif message['role'] | upper == 'ASSISTANT' -%}\n      {{ 'ASSISTANT: ' + message['content'] + eos_token}}\n    {%- endif -%}\n  {%- endif -%}\n{%- endfor -%}\n",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "legacy": false,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<unk>",
+  "sp_model_kwargs": {},
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}