MetaphoricalCode committed on
Commit
599e9ef
·
verified ·
1 Parent(s): 5e950fe

Upload 14 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Cydonia-v1.3-magnum-v4-22B.png filter=lfs diff=lfs merge=lfs -text
Cydonia-v1.3-magnum-v4-22B.png ADDED

Git LFS Details

  • SHA256: 11b18147c8c2f240f7b39fa8cc63c0f8c04dac5f077e20c260b26d950dd83125
  • Pointer size: 131 Bytes
  • Size of remote file: 828 kB
README.md ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model:
3
+ - knifeayumu/Cydonia-v1.3-Magnum-v4-22B
4
+ base_model_relation: quantized
5
+ library_name: transformers
6
+ tags:
7
+ - mergekit
8
+ - merge
9
+ license: other
10
+ license_name: mrl
11
+ inference: false
12
+ license_link: https://mistral.ai/licenses/MRL-0.1.md
13
+ ---
14
+ ## Quantized using the default exllamav3 (0.0.1) quantization process.
15
+
16
+ - Original model: https://huggingface.co/knifeayumu/Cydonia-v1.3-Magnum-v4-22B
17
+ - exllamav3: https://github.com/turboderp-org/exllamav3
18
+ ---
19
+ ![Not Horny Enough](Cydonia-v1.3-magnum-v4-22B.png)
20
+
21
+ # The Drummer becomes hornier (again)
22
+
23
+ Recipe based on [knifeayumu/Cydonia-v1.2-Magnum-v4-22B](https://huggingface.co/knifeayumu/Cydonia-v1.2-Magnum-v4-22B) but uses [TheDrummer/Cydonia-22B-v1.3](https://huggingface.co/TheDrummer/Cydonia-22B-v1.3) as the base.
24
+ Yes, MortalWombat. I'm gonna use your parameters as long as I can!
25
+
26
+ This is a merge of pre-trained language models created using [mergekit](https://github.com/arcee-ai/mergekit).
27
+
28
+ ## Merge Details
29
+ ### Merge Method
30
+
31
+ This model was merged using the SLERP merge method.
32
+
33
+ ### Models Merged
34
+
35
+ The following models were included in the merge:
36
+ * [TheDrummer/Cydonia-22B-v1.3](https://huggingface.co/TheDrummer/Cydonia-22B-v1.3)
37
+ * [anthracite-org/magnum-v4-22b](https://huggingface.co/anthracite-org/magnum-v4-22b)
38
+
39
+ ### Configuration
40
+
41
+ The following YAML configuration was used to produce this model:
42
+
43
+ ```yaml
44
+ models:
45
+ - model: TheDrummer/Cydonia-22B-v1.3
46
+ - model: anthracite-org/magnum-v4-22b
47
+ merge_method: slerp
48
+ base_model: TheDrummer/Cydonia-22B-v1.3
49
+ parameters:
50
+   t: [0.1, 0.3, 0.6, 0.3, 0.1]
51
+ dtype: bfloat16
52
+ ```
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "TheDrummer/Cydonia-22B-v1.3",
3
+ "architectures": [
4
+ "MistralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 6144,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 16384,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 48,
17
+ "num_hidden_layers": 56,
18
+ "num_key_value_heads": 8,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_theta": 1000000.0,
21
+ "sliding_window": null,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "bfloat16",
24
+ "transformers_version": "4.46.2",
25
+ "use_cache": true,
26
+ "vocab_size": 32768,
27
+ "quantization_config": {
28
+ "quant_method": "exl3",
29
+ "version": "0.0.1",
30
+ "bits": 8.0,
31
+ "head_bits": 8,
32
+ "calibration": {
33
+ "rows": 100,
34
+ "cols": 2048
35
+ },
36
+ "out_scales": "auto"
37
+ }
38
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ models:
2
+ - model: TheDrummer/Cydonia-22B-v1.3
3
+ - model: anthracite-org/magnum-v4-22b
4
+ merge_method: slerp
5
+ base_model: TheDrummer/Cydonia-22B-v1.3
6
+ parameters:
7
+   t: [0.1, 0.3, 0.6, 0.3, 0.1]
8
+ dtype: bfloat16
model-00001-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43f1c90be4c818412160faa2e9cb96f4225e219570cae237e2494a6de802fc85
3
+ size 8208860560
model-00002-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf5dd253838fa827117b6b081373a2ac42bd55b85c40aea0ed4f6ad0a88d52a2
3
+ size 8586826696
model-00003-of-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88af2479ca1549e76dd3cf2634655e975f7bc4f2679931f99e1ecf80d8541d0
3
+ size 5665761256
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
quantization_config.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59f95e28944c062244741268596badc900df86c7f5ded05088d2da22a7379e06
3
+ size 587583
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff