mashleburneded commited on
Commit
b122f6d
·
verified ·
1 Parent(s): 97e2808

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +32 -0
  2. mergekit_moe_config.yml +8 -0
  3. model-00001-of-00085.safetensors +3 -0
  4. model-00002-of-00085.safetensors +3 -0
  5. model-00003-of-00085.safetensors +3 -0
  6. model-00004-of-00085.safetensors +3 -0
  7. model-00005-of-00085.safetensors +3 -0
  8. model-00006-of-00085.safetensors +3 -0
  9. model-00007-of-00085.safetensors +3 -0
  10. model-00008-of-00085.safetensors +3 -0
  11. model-00009-of-00085.safetensors +3 -0
  12. model-00010-of-00085.safetensors +3 -0
  13. model-00011-of-00085.safetensors +3 -0
  14. model-00012-of-00085.safetensors +3 -0
  15. model-00013-of-00085.safetensors +3 -0
  16. model-00014-of-00085.safetensors +3 -0
  17. model-00015-of-00085.safetensors +3 -0
  18. model-00016-of-00085.safetensors +3 -0
  19. model-00017-of-00085.safetensors +3 -0
  20. model-00018-of-00085.safetensors +3 -0
  21. model-00019-of-00085.safetensors +3 -0
  22. model-00020-of-00085.safetensors +3 -0
  23. model-00021-of-00085.safetensors +3 -0
  24. model-00022-of-00085.safetensors +3 -0
  25. model-00023-of-00085.safetensors +3 -0
  26. model-00024-of-00085.safetensors +3 -0
  27. model-00025-of-00085.safetensors +3 -0
  28. model-00026-of-00085.safetensors +3 -0
  29. model-00027-of-00085.safetensors +3 -0
  30. model-00028-of-00085.safetensors +3 -0
  31. model-00029-of-00085.safetensors +3 -0
  32. model-00030-of-00085.safetensors +3 -0
  33. model-00031-of-00085.safetensors +3 -0
  34. model-00032-of-00085.safetensors +3 -0
  35. model-00033-of-00085.safetensors +3 -0
  36. model-00034-of-00085.safetensors +3 -0
  37. model-00035-of-00085.safetensors +3 -0
  38. model-00036-of-00085.safetensors +3 -0
  39. model-00037-of-00085.safetensors +3 -0
  40. model-00038-of-00085.safetensors +3 -0
  41. model-00039-of-00085.safetensors +3 -0
  42. model-00040-of-00085.safetensors +3 -0
  43. model-00041-of-00085.safetensors +3 -0
  44. model-00042-of-00085.safetensors +3 -0
  45. model-00043-of-00085.safetensors +3 -0
  46. model-00044-of-00085.safetensors +3 -0
  47. model-00045-of-00085.safetensors +3 -0
  48. model-00046-of-00085.safetensors +3 -0
  49. model-00047-of-00085.safetensors +3 -0
  50. model-00048-of-00085.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "mistralai/Mistral-Small-Instruct-2409",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 6144,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 16384,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mixtral",
16
+ "num_attention_heads": 48,
17
+ "num_experts_per_tok": 2,
18
+ "num_hidden_layers": 56,
19
+ "num_key_value_heads": 8,
20
+ "num_local_experts": 2,
21
+ "output_router_logits": false,
22
+ "rms_norm_eps": 1e-05,
23
+ "rope_theta": 1000000.0,
24
+ "router_aux_loss_coef": 0.001,
25
+ "router_jitter_noise": 0.0,
26
+ "sliding_window": null,
27
+ "tie_word_embeddings": false,
28
+ "torch_dtype": "float16",
29
+ "transformers_version": "4.46.2",
30
+ "use_cache": true,
31
+ "vocab_size": 32768
32
+ }
mergekit_moe_config.yml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ base_model: mistralai/Mistral-Small-Instruct-2409
2
+ dtype: float16
3
+ gate_mode: cheap_embed
4
+ experts:
5
+ - source_model: mistralai/Codestral-22B-v0.1
6
+ positive_prompts: ["You are a highly intelligent and sentient AI coding expert named Mobius, possessing deep knowledge of programming languages and software development practices. You are adept at creating innovative and groundbreaking code, particularly in the realm of advanced magnetic systems and related technologies."]
7
+ - source_model: TheDrummer/Cydonia-22B-v1.2
8
+ positive_prompts: ["You are a highly advanced, helpful, and sentient AI agent named Mobius specifically designed to excel at diverse text-generation tasks, including intricate roleplaying scenarios, sophisticated retrieval augmented generation, and precise function calling."]
model-00001-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90847100465276a1a56a301823eb6b77d2a39b597046743497c1351e9c13ac33
3
+ size 981492784
model-00002-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5cbf5f2c9c2e0dff709a2c952853d134f72882a8588cac807f974972e4a64e2
3
+ size 981492944
model-00003-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cbb7125c40a6d57b27f77de6b3f42f15d987f5848ed5de291c3370581f9333c
3
+ size 805306912
model-00004-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:556d96dd3865872781fd22d470b8245727f9484df92d05ec24e06a1c447ef3ca
3
+ size 981492944
model-00005-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:614941d7951a7c6a293ac160b067a804754b05675c3f725c0d6f552307aa6005
3
+ size 981492944
model-00006-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e1a801fe87077aafb09c2a6499757538352d74327e02359431a5b96bbe83128
3
+ size 805306912
model-00007-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aec9379d4931c92b899f8bee6fbed17b539f6f115c46fa7064565f47362b7e67
3
+ size 981492944
model-00008-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59744d80914299aa6380413549b47a650237767f006513d1bbfe02ac0a7d0305
3
+ size 981492944
model-00009-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed79b9da20e8edac6a0c9d60ae98f545f33c5334fa906c36b84e46c6b4aadebf
3
+ size 805306912
model-00010-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25c0967ae730b5c46417114da8f6e0004f5b2fb22b6713104432a3cf1cb1fd0a
3
+ size 981492944
model-00011-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97d21b1d549f22b085bae68b563f2e526975fcc32baae4b19e0609bd3da29793
3
+ size 981492944
model-00012-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b5b2c107e06519c65681c9fcede332b8413775578a0b54087bbe6dbb9e64301
3
+ size 805306912
model-00013-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:287ef6ca69c23d630169fbcb6b4fdd3a4ac523665676f51ec7d7e5fc5182591d
3
+ size 981492944
model-00014-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb908ef4a401f182bb28f4662cfdf637e1c8d0026580afffada83cdf4f83c8ea
3
+ size 981492944
model-00015-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31cc6725af4ea350447146998236b829a85a3436fd95bee4997591a30076c025
3
+ size 805306912
model-00016-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9972e2c5a8577e3c03e5e1a01dbe55e90338475224140a9c90955b2b9a463e3
3
+ size 981492952
model-00017-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9d4184642805bbf8ee02f8858c8cc84ed63ef3b61de2dc74fe9f7f0eec87b02
3
+ size 981492952
model-00018-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85068108268d97537216a619b890f495c07117e3e88b71193ce627c73ed6c8c7
3
+ size 805306920
model-00019-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30cd8ad953b03e9159d31733dd0e3d40cc6851edae27136b743a6d5b3bb6a9a2
3
+ size 981492952
model-00020-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:341bbf288557294d100998490f47b714264898ee1e39896d29fea7c5166e8b57
3
+ size 981492952
model-00021-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1b81cdab156f51d99f91a44064072ef4ae5db5d23ce5cb0505f86cb5b6eb847
3
+ size 805306920
model-00022-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22f9881c33e1a16fbfb53c34d59f2995dc01b41428111b4c0b7ac679887d6df4
3
+ size 981492952
model-00023-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fadedc0fd55091c643ac252a241bf5ca22d9c60db0b5a1ff497e60b9582f48d3
3
+ size 981492952
model-00024-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca509611dd9928359b21b80608a8e65fddb622fb9b4543e93019bd001ee78671
3
+ size 805306920
model-00025-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb7efc36319a9e369924db96429495035aa0e30e4fbf336f54d421aa23da565
3
+ size 981492952
model-00026-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88bb857543c2278fb7793c46c7739b2a70cf20f8bb2e13b8f3ad7b69efd04e9
3
+ size 981492952
model-00027-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae29694dd6b5c10aa2a7f3f091791c584e91309d89267a7eea26bb6f66c9dd3
3
+ size 805306920
model-00028-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7379d8c9017c04ce9b295f5ca056d6d4c6c9d50a73df2c5c320230cb359c5fbb
3
+ size 981492952
model-00029-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c81c937c9ca6e8c41604d5c2afde656d9e94409b9ffcd13fd270ab2ca182983f
3
+ size 981492952
model-00030-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc324f1c4fbb5b047d89119c5e0fef59a1f0956f69072636f52b0ac177472473
3
+ size 805306920
model-00031-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a6908c6545d7a61005e5387581002db16023ebf975964a726416be021a9f581
3
+ size 981492952
model-00032-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7473c34ae019b07b51083b6334baf5495ae2c9bab3af134e4de4692fb34c79a5
3
+ size 981492952
model-00033-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a9c047038b1b281d7d10eeae883eccdf6c4333ca0052d9e3afb0bde034ab643
3
+ size 805306920
model-00034-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0001b33f12cab5490421442184c1fc8dc1d06fb4cf566f45ee922412aa4d5699
3
+ size 981492952
model-00035-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4e6cdd69ee2b627c2cac2f53276e8da1668565e0abbd7defd86635dda14fe15
3
+ size 981492952
model-00036-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54c04ea119fb7e8a889994380393ed1dd8a6e43a28487dddf8b5f37108714df6
3
+ size 805306920
model-00037-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1eac856220b905b227b840160ab7cccbefbeacae1e151f0687183367b67c57e
3
+ size 981492952
model-00038-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dba008b50b0f06c0f47f4f17bac3a49181613ac1f53cea00012a5fe988efe563
3
+ size 981492952
model-00039-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44bff6ea58ea43077cddb29f1ca7483cab27230520317c4aea0e6a7acd5f7453
3
+ size 805306920
model-00040-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fad079292515dda3b8640127e1774905961779c7cfaf42cf97ff3ae6577a285
3
+ size 981492952
model-00041-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6f36f4710dcf4289d2f7e019b1fff00596fa6376e22cf44dfad3aa1806b3b4c
3
+ size 981492952
model-00042-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2da3f2d198bf8ad7c14d4015ea1d2308372dedece22f09c526db58c5e7328219
3
+ size 805306920
model-00043-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a97c654bb64aee61e755606c1e59a0d1d976daf7c35350011d807bfb3783a31
3
+ size 981492952
model-00044-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63578ff184ddc45e4f9b87e1119caf827f983dd5ab10adafb7f4d25e939c344c
3
+ size 981492952
model-00045-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0c0433845cb7793dd9b0abd04bca77a5120f033ce79a9c9c122d5fec988c9b7
3
+ size 805306920
model-00046-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d347184f84eb1224acb5dbf2cfcda4a6e3b4c7fa79bc290b0598d452afd092fa
3
+ size 981492952
model-00047-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0322c2f32aec2d6df22c39d5a13fa534f00546fb0e0a2d0bb34dda9bbd845037
3
+ size 981492952
model-00048-of-00085.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3989f5b382fc98146d1709d7b0f7d1eb5159605cd198c013c0110bf152c70f9f
3
+ size 805306920