Holy-fox committed on
Commit
49b3c61
·
verified ·
1 Parent(s): 5b342a4

Upload 76 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +40 -3
  3. added_tokens.json +24 -0
  4. config.json +29 -0
  5. mergekit_config.yml +9 -0
  6. merges.txt +0 -0
  7. model-00001-of-00066.safetensors +3 -0
  8. model-00002-of-00066.safetensors +3 -0
  9. model-00003-of-00066.safetensors +3 -0
  10. model-00004-of-00066.safetensors +3 -0
  11. model-00005-of-00066.safetensors +3 -0
  12. model-00006-of-00066.safetensors +3 -0
  13. model-00007-of-00066.safetensors +3 -0
  14. model-00008-of-00066.safetensors +3 -0
  15. model-00009-of-00066.safetensors +3 -0
  16. model-00010-of-00066.safetensors +3 -0
  17. model-00011-of-00066.safetensors +3 -0
  18. model-00012-of-00066.safetensors +3 -0
  19. model-00013-of-00066.safetensors +3 -0
  20. model-00014-of-00066.safetensors +3 -0
  21. model-00015-of-00066.safetensors +3 -0
  22. model-00016-of-00066.safetensors +3 -0
  23. model-00017-of-00066.safetensors +3 -0
  24. model-00018-of-00066.safetensors +3 -0
  25. model-00019-of-00066.safetensors +3 -0
  26. model-00020-of-00066.safetensors +3 -0
  27. model-00021-of-00066.safetensors +3 -0
  28. model-00022-of-00066.safetensors +3 -0
  29. model-00023-of-00066.safetensors +3 -0
  30. model-00024-of-00066.safetensors +3 -0
  31. model-00025-of-00066.safetensors +3 -0
  32. model-00026-of-00066.safetensors +3 -0
  33. model-00027-of-00066.safetensors +3 -0
  34. model-00028-of-00066.safetensors +3 -0
  35. model-00029-of-00066.safetensors +3 -0
  36. model-00030-of-00066.safetensors +3 -0
  37. model-00031-of-00066.safetensors +3 -0
  38. model-00032-of-00066.safetensors +3 -0
  39. model-00033-of-00066.safetensors +3 -0
  40. model-00034-of-00066.safetensors +3 -0
  41. model-00035-of-00066.safetensors +3 -0
  42. model-00036-of-00066.safetensors +3 -0
  43. model-00037-of-00066.safetensors +3 -0
  44. model-00038-of-00066.safetensors +3 -0
  45. model-00039-of-00066.safetensors +3 -0
  46. model-00040-of-00066.safetensors +3 -0
  47. model-00041-of-00066.safetensors +3 -0
  48. model-00042-of-00066.safetensors +3 -0
  49. model-00043-of-00066.safetensors +3 -0
  50. model-00044-of-00066.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -1,3 +1,40 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model:
3
+ - Saxo/Linkbricks-Horizon-AI-Japanese-Base-32B
4
+ - karakuri-ai/karakuri-lm-32b-thinking-2501-exp
5
+ library_name: transformers
6
+ tags:
7
+ - mergekit
8
+ - merge
9
+
10
+ ---
11
+ # SKYCAVE_element_QwQ_jp
12
+
13
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
14
+
15
+ ## Merge Details
16
+ ### Merge Method
17
+
18
+ This model was merged using the [SLERP](https://en.wikipedia.org/wiki/Slerp) merge method.
19
+
20
+ ### Models Merged
21
+
22
+ The following models were included in the merge:
23
+ * [Saxo/Linkbricks-Horizon-AI-Japanese-Base-32B](https://huggingface.co/Saxo/Linkbricks-Horizon-AI-Japanese-Base-32B)
24
+ * [karakuri-ai/karakuri-lm-32b-thinking-2501-exp](https://huggingface.co/karakuri-ai/karakuri-lm-32b-thinking-2501-exp)
25
+
26
+ ### Configuration
27
+
28
+ The following YAML configuration was used to produce this model:
29
+
30
+ ```yaml
31
+ merge_method: slerp
32
+ base_model: karakuri-ai/karakuri-lm-32b-thinking-2501-exp
33
+ models:
34
+ - model: karakuri-ai/karakuri-lm-32b-thinking-2501-exp
35
+ - model: Saxo/Linkbricks-Horizon-AI-Japanese-Base-32B
36
+ parameters:
37
+   t: 0.35
38
+ dtype: bfloat16
39
+ name: SKYCAVE_element_QwQ_jp
40
+ ```
added_tokens.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "</tool_call>": 151658,
3
+ "<tool_call>": 151657,
4
+ "<|box_end|>": 151649,
5
+ "<|box_start|>": 151648,
6
+ "<|endoftext|>": 151643,
7
+ "<|file_sep|>": 151664,
8
+ "<|fim_middle|>": 151660,
9
+ "<|fim_pad|>": 151662,
10
+ "<|fim_prefix|>": 151659,
11
+ "<|fim_suffix|>": 151661,
12
+ "<|im_end|>": 151645,
13
+ "<|im_start|>": 151644,
14
+ "<|image_pad|>": 151655,
15
+ "<|object_ref_end|>": 151647,
16
+ "<|object_ref_start|>": 151646,
17
+ "<|quad_end|>": 151651,
18
+ "<|quad_start|>": 151650,
19
+ "<|repo_name|>": 151663,
20
+ "<|video_pad|>": 151656,
21
+ "<|vision_end|>": 151653,
22
+ "<|vision_pad|>": 151654,
23
+ "<|vision_start|>": 151652
24
+ }
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "karakuri-ai/karakuri-lm-32b-thinking-2501-exp",
3
+ "architectures": [
4
+ "Qwen2ForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 5120,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 27648,
13
+ "max_position_embeddings": 32768,
14
+ "max_window_layers": 64,
15
+ "model_type": "qwen2",
16
+ "num_attention_heads": 40,
17
+ "num_hidden_layers": 64,
18
+ "num_key_value_heads": 8,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_scaling": null,
21
+ "rope_theta": 1000000.0,
22
+ "sliding_window": null,
23
+ "tie_word_embeddings": false,
24
+ "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.48.1",
26
+ "use_cache": true,
27
+ "use_sliding_window": false,
28
+ "vocab_size": 152064
29
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ merge_method: slerp
2
+ base_model: karakuri-ai/karakuri-lm-32b-thinking-2501-exp
3
+ models:
4
+ - model: karakuri-ai/karakuri-lm-32b-thinking-2501-exp
5
+ - model: Saxo/Linkbricks-Horizon-AI-Japanese-Base-32B
6
+ parameters:
7
+ t: 0.35
8
+ dtype: bfloat16
9
+ name: SKYCAVE_element_QwQ_jp
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d08720dee93b8c6241a03e1e77d2669a85836ca1504bca21a3c7006e1c02f867
3
+ size 1557135488
model-00002-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76e59bb87d74415d6e2e514902d7db6bddab8dbc6e40f5b389bebf22becdd911
3
+ size 1557135504
model-00003-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae63642ee25da9821a35b1c5654bc78c1c72c1663a7da3fdecf2353ce68d054a
3
+ size 975222224
model-00004-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9333053225b655a753e0923dbbbc77f72613922829735faa26bdc7934b27724
3
+ size 975211880
model-00005-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ba3463e26fcc62194e24aa2356ae922980525081fbb0aa78e01a2108f51e301
3
+ size 975211888
model-00006-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00520616f4ba6ab0f727ce8298a4b5f87f55a2d5b3fdac73428be68dcf491163
3
+ size 975211888
model-00007-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0496857f5cba2c04776d4a08cf49c43362189363ce19ac8bd8d057bc6e2056e3
3
+ size 975211888
model-00008-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:435deaefc72176d3f5c35dc56e64e448dd3241008668ea8e0a75e1b4fcabb733
3
+ size 975211888
model-00009-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b003fd3f21e568541835693e76789feb68c8d1bae077806c98e1aae14fdc9e36
3
+ size 975211888
model-00010-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2be967f2ab97aa7dd07d90e370298efe488e854ace6190c175b03a13c1c04ca
3
+ size 975211888
model-00011-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:312c133c84c2ccf8c888825ff3d8b804304b962b0008b8b5c492366dcd8075f1
3
+ size 975211888
model-00012-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fda7147476cc49efe1fcd69940f0f2c769a07dbb420a4b472260d9f8ee7f351
3
+ size 975211888
model-00013-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45e29feaa716b81d4f3170ba4c100ac7e1a8facb05b8bdd56e3faec6f0596339
3
+ size 975211888
model-00014-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cad3252e284282711eea33e6861da9ef34073c28beb7c5b90951f4014a09f137
3
+ size 975211888
model-00015-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d549091cb5c31d4bb9991f8aade8914697c0a950203f0b9adff09a3c2f3faba
3
+ size 975211880
model-00016-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c19d29e566ee3d0b5d0cf4f467181b7f40c36ee9373634e2c4dcdbbd226aa813
3
+ size 975211888
model-00017-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27c508d1a3baa9b7685ee8d69f382831a9e66fa3b24d6c889f6514b4d7d7954d
3
+ size 975211888
model-00018-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e2c641457d52a2e2a2dabf5c44daa6dea383a36214e24969601c243a99bc42
3
+ size 975211888
model-00019-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:743089cf1bdbd86b8edb9c86ac9e7a32ec4fdaf7f600aef0f73676b562fc9699
3
+ size 975211888
model-00020-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a0a262f544f2a025d956f33809af6cd773540847e636b006ae6ff29ac94f10a
3
+ size 975211888
model-00021-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2812ba15992f2ef9f21853ef6c5a3f74844ffd1c63e89939b193355cf012f85e
3
+ size 975211888
model-00022-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc9e6d1539b5a170d66c8d43f9c799b1b4db5378d9f05da40ba193bb75255c8b
3
+ size 975211888
model-00023-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e415a20320449198e1fdbf12fbdbf2c6b2723679c1617677f82b43da6c714b10
3
+ size 975211888
model-00024-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcf57f615bca9f7c16ba37b1be0b2c88e381b32d663ad81ccaac1356526e9495
3
+ size 975211888
model-00025-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4590501d1e9c0604672d7f24d8c7e2e5a15f6075bfcd4179f33a651c3b4db8bf
3
+ size 975211888
model-00026-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa597b8c8f892503d80d4b72102ec76c0e7d3226cfb040a564168f626ceb953
3
+ size 975211880
model-00027-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8f249f0f7dc64dd96e611ad5d2bfa6091e483fd450f8ccbe3aac81059b0409f
3
+ size 975211888
model-00028-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:525059d7c78ad06236c41f7886495f03bd1c767d5ef51744fbe85f1249f35f0f
3
+ size 975211888
model-00029-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:957d85928fcd5f176cea7ee12082747be89589383b4c90613576d4d91e8d237a
3
+ size 975211888
model-00030-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60412bafafdc81560ffd4f77fc237838dfcfccd86d6bbf1781f4f072efa21819
3
+ size 975211888
model-00031-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:099694806f44ed713bc248edb1b2b60c6a21c5b37addd4f4ef08e9e8fd0503e9
3
+ size 975211888
model-00032-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a600914171661a2f4b54c504badb318e0bab403445fd27f4b3873bab5818502
3
+ size 975211888
model-00033-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:569ed53992b8e4a2353cbb2b57801e5a1827d62ae2b85cdef1a1edc199664bbf
3
+ size 975211888
model-00034-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69452432554d62404ec77732f1d997b8891a9238884a6deb114c707fbb517c08
3
+ size 975211888
model-00035-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b2dbaec1c8cde73dffb17aa7cfb98b829e53f915fe9b0db0423e2baf10d0c54
3
+ size 975211888
model-00036-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6814c6300161130dacd6163164b41e1108eab4285a6dd9bc9532005585cf59d
3
+ size 975211888
model-00037-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5748ba5131b069b25cebc1eba3bdac7f2606357c78fdcf54c9017fa277891fd1
3
+ size 975211880
model-00038-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c7beb63c0ce8713e7c2da33d25dfad899162d251f345be7aa4f1297a28581be
3
+ size 975211888
model-00039-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65a5fad6ecc269602ddd1b6d6230dff8b0f3713add44f7acf203fa6792e0095b
3
+ size 975211888
model-00040-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ac9de52b3092d44cc0625d147b410ff7e6f0e69be91f27c35c09e3c8a46fd2c
3
+ size 975211888
model-00041-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab205964b657d5520e5c6ecb14fe0c6bd4caaa63ba0330a7c0c3d00ed4155890
3
+ size 975211888
model-00042-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93a6071091ddc02058692303c1f5f3ee828b6bb1dae877dc076320c7729418d4
3
+ size 975211888
model-00043-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5ab3923216ed4cf18352514c13ca8d804427d396b78116a146b1c06fdf6d985
3
+ size 975211888
model-00044-of-00066.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c788db0b84787af920a4907486d1e5cce7a12763b85400ee278664ea2c366a40
3
+ size 975211888