Add llm_config.json (Q4+int4 PLE, requires TokForge 3.4.9)
Browse files- llm_config.json +48 -0
llm_config.json
ADDED
|
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "gemma4",
|
| 3 |
+
"hidden_size": 2560,
|
| 4 |
+
"attention_mask": "float",
|
| 5 |
+
"attention_type": "mix",
|
| 6 |
+
"is_mrope": false,
|
| 7 |
+
"layer_nums": 42,
|
| 8 |
+
"hidden_size_per_layer_input": 256,
|
| 9 |
+
"per_layer_embedding_hidden_size": 10752,
|
| 10 |
+
"per_layer_embedding_file": "per_layer_embeddings_int4.bin",
|
| 11 |
+
"per_layer_scale_emb": 16.0,
|
| 12 |
+
"use_template": true,
|
| 13 |
+
"force_full_decode_recompute": false,
|
| 14 |
+
"jinja": {
|
| 15 |
+
"chat_template": "{{ bos_token }}{% for message in messages %}{% if message.role == \"system\" %}<|turn>system\n{{ message.content }}<turn|>\n{% elif message.role == \"user\" %}<|turn>user\n{{ message.content }}<turn|>\n{% elif message.role == \"assistant\" %}<|turn>model\n{{ message.content }}<turn|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|turn>model\n{% endif %}",
|
| 16 |
+
"bos": "<bos>",
|
| 17 |
+
"eos": "<turn|>"
|
| 18 |
+
},
|
| 19 |
+
"scale_emb": 50.5,
|
| 20 |
+
"sampler_type": "mixed",
|
| 21 |
+
"temperature": 1.0,
|
| 22 |
+
"top_k": 64,
|
| 23 |
+
"top_p": 0.95,
|
| 24 |
+
"min_p": 0.0,
|
| 25 |
+
"tfs_z": 1.0,
|
| 26 |
+
"typical": 1.0,
|
| 27 |
+
"repetition_penalty": 1.0,
|
| 28 |
+
"presence_penalty": 0.0,
|
| 29 |
+
"frequency_penalty": 0.0,
|
| 30 |
+
"penalty_window": 0,
|
| 31 |
+
"n_gram": 8,
|
| 32 |
+
"ngram_factor": 1.0,
|
| 33 |
+
"sliding_window": 512,
|
| 34 |
+
"tie_embeddings": [
|
| 35 |
+
0,
|
| 36 |
+
335544320,
|
| 37 |
+
41943040,
|
| 38 |
+
4,
|
| 39 |
+
128
|
| 40 |
+
],
|
| 41 |
+
"ple_quant": [
|
| 42 |
+
0,
|
| 43 |
+
1409286144,
|
| 44 |
+
176160768,
|
| 45 |
+
4,
|
| 46 |
+
128
|
| 47 |
+
]
|
| 48 |
+
}
|