ddh0 committed on
Commit
75fb0f1
·
verified ·
1 Parent(s): 3cbccfe

Create README.md

Browse files
Files changed (1) hide show
  1. README.md +26 -0
README.md ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model:
3
+ - ConicCat/Qwen3.5-27B-Writer
4
+ ---
5
+ ```bash
6
+ IMATRIX=~/imatrices/ConicCat-Qwen3.5-27B-Writer-ddh0_v2-imatrix.gguf
7
+ SRC_GGUF=~/gguf/ConicCat-Qwen3.5-27B-Writer-bf16.gguf
8
+ DST_GGUF=~/gguf/ConicCat-Qwen3.5-27B-Writer-5.45bpw.gguf
9
+ time llama-quantize \
10
+ --imatrix "$IMATRIX" \
11
+ --token-embedding-type Q4_K \
12
+ --tensor-type ffn_up=Q4_K \
13
+ --tensor-type ffn_gate=Q4_K \
14
+ --tensor-type ffn_down=Q5_K \
15
+ --tensor-type attn_qkv=Q6_K \
16
+ --tensor-type attn_k=Q8_0 \
17
+ --tensor-type attn_v=Q8_0 \
18
+ --tensor-type attn_output=Q5_K \
19
+ --tensor-type attn_q=Q4_K \
20
+ --tensor-type ssm_alpha=f32 \
21
+ --tensor-type ssm_beta=f32 \
22
+ --tensor-type ssm_out=Q5_K \
23
+ --tensor-type attn_gate=Q8_0 \
24
+ --output-tensor-type Q8_0 \
25
+ "$SRC_GGUF" "$DST_GGUF" Q8_0 "$(nproc)"
26
+ ```