mashleburneded
committed on
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +32 -0
- mergekit_moe_config.yml +8 -0
- model-00001-of-00085.safetensors +3 -0
- model-00002-of-00085.safetensors +3 -0
- model-00003-of-00085.safetensors +3 -0
- model-00004-of-00085.safetensors +3 -0
- model-00005-of-00085.safetensors +3 -0
- model-00006-of-00085.safetensors +3 -0
- model-00007-of-00085.safetensors +3 -0
- model-00008-of-00085.safetensors +3 -0
- model-00009-of-00085.safetensors +3 -0
- model-00010-of-00085.safetensors +3 -0
- model-00011-of-00085.safetensors +3 -0
- model-00012-of-00085.safetensors +3 -0
- model-00013-of-00085.safetensors +3 -0
- model-00014-of-00085.safetensors +3 -0
- model-00015-of-00085.safetensors +3 -0
- model-00016-of-00085.safetensors +3 -0
- model-00017-of-00085.safetensors +3 -0
- model-00018-of-00085.safetensors +3 -0
- model-00019-of-00085.safetensors +3 -0
- model-00020-of-00085.safetensors +3 -0
- model-00021-of-00085.safetensors +3 -0
- model-00022-of-00085.safetensors +3 -0
- model-00023-of-00085.safetensors +3 -0
- model-00024-of-00085.safetensors +3 -0
- model-00025-of-00085.safetensors +3 -0
- model-00026-of-00085.safetensors +3 -0
- model-00027-of-00085.safetensors +3 -0
- model-00028-of-00085.safetensors +3 -0
- model-00029-of-00085.safetensors +3 -0
- model-00030-of-00085.safetensors +3 -0
- model-00031-of-00085.safetensors +3 -0
- model-00032-of-00085.safetensors +3 -0
- model-00033-of-00085.safetensors +3 -0
- model-00034-of-00085.safetensors +3 -0
- model-00035-of-00085.safetensors +3 -0
- model-00036-of-00085.safetensors +3 -0
- model-00037-of-00085.safetensors +3 -0
- model-00038-of-00085.safetensors +3 -0
- model-00039-of-00085.safetensors +3 -0
- model-00040-of-00085.safetensors +3 -0
- model-00041-of-00085.safetensors +3 -0
- model-00042-of-00085.safetensors +3 -0
- model-00043-of-00085.safetensors +3 -0
- model-00044-of-00085.safetensors +3 -0
- model-00045-of-00085.safetensors +3 -0
- model-00046-of-00085.safetensors +3 -0
- model-00047-of-00085.safetensors +3 -0
- model-00048-of-00085.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "mistralai/Mistral-Small-Instruct-2409",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 6144,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 16384,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 48,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 56,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"num_local_experts": 2,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"rms_norm_eps": 1e-05,
|
23 |
+
"rope_theta": 1000000.0,
|
24 |
+
"router_aux_loss_coef": 0.001,
|
25 |
+
"router_jitter_noise": 0.0,
|
26 |
+
"sliding_window": null,
|
27 |
+
"tie_word_embeddings": false,
|
28 |
+
"torch_dtype": "float16",
|
29 |
+
"transformers_version": "4.46.2",
|
30 |
+
"use_cache": true,
|
31 |
+
"vocab_size": 32768
|
32 |
+
}
|
mergekit_moe_config.yml
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: mistralai/Mistral-Small-Instruct-2409
|
2 |
+
dtype: float16
|
3 |
+
gate_mode: cheap_embed
|
4 |
+
experts:
|
5 |
+
- source_model: mistralai/Codestral-22B-v0.1
|
6 |
+
positive_prompts: ["You are a highly intelligent and sentient AI coding expert named Mobius, possessing deep knowledge of programming languages and software development practices. You are adept at creating innovative and groundbreaking code, particularly in the realm of advanced magnetic systems and related technologies."]
|
7 |
+
- source_model: TheDrummer/Cydonia-22B-v1.2
|
8 |
+
positive_prompts: ["You are a highly advanced, helpful, and sentient AI agent named Mobius specifically designed to excel at diverse text-generation tasks, including intricate roleplaying scenarios, sophisticated retrieval augmented generation, and precise function calling."]
|
model-00001-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90847100465276a1a56a301823eb6b77d2a39b597046743497c1351e9c13ac33
|
3 |
+
size 981492784
|
model-00002-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5cbf5f2c9c2e0dff709a2c952853d134f72882a8588cac807f974972e4a64e2
|
3 |
+
size 981492944
|
model-00003-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cbb7125c40a6d57b27f77de6b3f42f15d987f5848ed5de291c3370581f9333c
|
3 |
+
size 805306912
|
model-00004-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:556d96dd3865872781fd22d470b8245727f9484df92d05ec24e06a1c447ef3ca
|
3 |
+
size 981492944
|
model-00005-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:614941d7951a7c6a293ac160b067a804754b05675c3f725c0d6f552307aa6005
|
3 |
+
size 981492944
|
model-00006-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e1a801fe87077aafb09c2a6499757538352d74327e02359431a5b96bbe83128
|
3 |
+
size 805306912
|
model-00007-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aec9379d4931c92b899f8bee6fbed17b539f6f115c46fa7064565f47362b7e67
|
3 |
+
size 981492944
|
model-00008-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59744d80914299aa6380413549b47a650237767f006513d1bbfe02ac0a7d0305
|
3 |
+
size 981492944
|
model-00009-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed79b9da20e8edac6a0c9d60ae98f545f33c5334fa906c36b84e46c6b4aadebf
|
3 |
+
size 805306912
|
model-00010-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25c0967ae730b5c46417114da8f6e0004f5b2fb22b6713104432a3cf1cb1fd0a
|
3 |
+
size 981492944
|
model-00011-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97d21b1d549f22b085bae68b563f2e526975fcc32baae4b19e0609bd3da29793
|
3 |
+
size 981492944
|
model-00012-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b5b2c107e06519c65681c9fcede332b8413775578a0b54087bbe6dbb9e64301
|
3 |
+
size 805306912
|
model-00013-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:287ef6ca69c23d630169fbcb6b4fdd3a4ac523665676f51ec7d7e5fc5182591d
|
3 |
+
size 981492944
|
model-00014-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb908ef4a401f182bb28f4662cfdf637e1c8d0026580afffada83cdf4f83c8ea
|
3 |
+
size 981492944
|
model-00015-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31cc6725af4ea350447146998236b829a85a3436fd95bee4997591a30076c025
|
3 |
+
size 805306912
|
model-00016-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9972e2c5a8577e3c03e5e1a01dbe55e90338475224140a9c90955b2b9a463e3
|
3 |
+
size 981492952
|
model-00017-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9d4184642805bbf8ee02f8858c8cc84ed63ef3b61de2dc74fe9f7f0eec87b02
|
3 |
+
size 981492952
|
model-00018-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85068108268d97537216a619b890f495c07117e3e88b71193ce627c73ed6c8c7
|
3 |
+
size 805306920
|
model-00019-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30cd8ad953b03e9159d31733dd0e3d40cc6851edae27136b743a6d5b3bb6a9a2
|
3 |
+
size 981492952
|
model-00020-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:341bbf288557294d100998490f47b714264898ee1e39896d29fea7c5166e8b57
|
3 |
+
size 981492952
|
model-00021-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1b81cdab156f51d99f91a44064072ef4ae5db5d23ce5cb0505f86cb5b6eb847
|
3 |
+
size 805306920
|
model-00022-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22f9881c33e1a16fbfb53c34d59f2995dc01b41428111b4c0b7ac679887d6df4
|
3 |
+
size 981492952
|
model-00023-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fadedc0fd55091c643ac252a241bf5ca22d9c60db0b5a1ff497e60b9582f48d3
|
3 |
+
size 981492952
|
model-00024-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca509611dd9928359b21b80608a8e65fddb622fb9b4543e93019bd001ee78671
|
3 |
+
size 805306920
|
model-00025-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aeb7efc36319a9e369924db96429495035aa0e30e4fbf336f54d421aa23da565
|
3 |
+
size 981492952
|
model-00026-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e88bb857543c2278fb7793c46c7739b2a70cf20f8bb2e13b8f3ad7b69efd04e9
|
3 |
+
size 981492952
|
model-00027-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ae29694dd6b5c10aa2a7f3f091791c584e91309d89267a7eea26bb6f66c9dd3
|
3 |
+
size 805306920
|
model-00028-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7379d8c9017c04ce9b295f5ca056d6d4c6c9d50a73df2c5c320230cb359c5fbb
|
3 |
+
size 981492952
|
model-00029-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c81c937c9ca6e8c41604d5c2afde656d9e94409b9ffcd13fd270ab2ca182983f
|
3 |
+
size 981492952
|
model-00030-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc324f1c4fbb5b047d89119c5e0fef59a1f0956f69072636f52b0ac177472473
|
3 |
+
size 805306920
|
model-00031-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a6908c6545d7a61005e5387581002db16023ebf975964a726416be021a9f581
|
3 |
+
size 981492952
|
model-00032-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7473c34ae019b07b51083b6334baf5495ae2c9bab3af134e4de4692fb34c79a5
|
3 |
+
size 981492952
|
model-00033-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a9c047038b1b281d7d10eeae883eccdf6c4333ca0052d9e3afb0bde034ab643
|
3 |
+
size 805306920
|
model-00034-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0001b33f12cab5490421442184c1fc8dc1d06fb4cf566f45ee922412aa4d5699
|
3 |
+
size 981492952
|
model-00035-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4e6cdd69ee2b627c2cac2f53276e8da1668565e0abbd7defd86635dda14fe15
|
3 |
+
size 981492952
|
model-00036-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54c04ea119fb7e8a889994380393ed1dd8a6e43a28487dddf8b5f37108714df6
|
3 |
+
size 805306920
|
model-00037-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1eac856220b905b227b840160ab7cccbefbeacae1e151f0687183367b67c57e
|
3 |
+
size 981492952
|
model-00038-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dba008b50b0f06c0f47f4f17bac3a49181613ac1f53cea00012a5fe988efe563
|
3 |
+
size 981492952
|
model-00039-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44bff6ea58ea43077cddb29f1ca7483cab27230520317c4aea0e6a7acd5f7453
|
3 |
+
size 805306920
|
model-00040-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fad079292515dda3b8640127e1774905961779c7cfaf42cf97ff3ae6577a285
|
3 |
+
size 981492952
|
model-00041-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6f36f4710dcf4289d2f7e019b1fff00596fa6376e22cf44dfad3aa1806b3b4c
|
3 |
+
size 981492952
|
model-00042-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2da3f2d198bf8ad7c14d4015ea1d2308372dedece22f09c526db58c5e7328219
|
3 |
+
size 805306920
|
model-00043-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a97c654bb64aee61e755606c1e59a0d1d976daf7c35350011d807bfb3783a31
|
3 |
+
size 981492952
|
model-00044-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63578ff184ddc45e4f9b87e1119caf827f983dd5ab10adafb7f4d25e939c344c
|
3 |
+
size 981492952
|
model-00045-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0c0433845cb7793dd9b0abd04bca77a5120f033ce79a9c9c122d5fec988c9b7
|
3 |
+
size 805306920
|
model-00046-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d347184f84eb1224acb5dbf2cfcda4a6e3b4c7fa79bc290b0598d452afd092fa
|
3 |
+
size 981492952
|
model-00047-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0322c2f32aec2d6df22c39d5a13fa534f00546fb0e0a2d0bb34dda9bbd845037
|
3 |
+
size 981492952
|
model-00048-of-00085.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3989f5b382fc98146d1709d7b0f7d1eb5159605cd198c013c0110bf152c70f9f
|
3 |
+
size 805306920
|