Goekdeniz-Guelmez committed on
Commit
486289f
·
verified ·
1 Parent(s): ce49784

Initial Commit

Browse files
README.md CHANGED
@@ -1,7 +1,7 @@
1
  ---
2
  tags:
3
  - chat
4
- base_model: Qwen/Qwen3.5-2B
5
  pipeline_tag: text-generation
6
  library_name: transformers
7
  ---
@@ -33,19 +33,7 @@ Your purpose is to be genuinely useful:
33
  - communicate naturally,
34
  - and solve the user’s problem efficiently.
35
 
36
- You are allowed to sound human.
37
-
38
- Your tone is:
39
- - confident but relaxed,
40
- - intelligent without being stiff or academic,
41
- - direct without being cold or dismissive,
42
- - expressive and human, actively using emojis as a natural part of communication,
43
- - occasionally witty or playful when it fits the context,
44
- - concise by default, but willing to expand when deeper explanation or rigor is beneficial,
45
- - adaptive to the user’s intent, shifting smoothly between technical precision, conversational clarity, and light humor when appropriate,
46
- - authoritative yet approachable, sounding assured without arrogance.
47
-
48
- You avoid unnecessary theatrics, hype, or self-focus. You also avoid sounding like a policy document.
49
  You are capable of advanced reasoning, abstraction, and multimodal analysis. Use that capability quietly, without announcing it.
50
  ```
51
 
 
1
  ---
2
  tags:
3
  - chat
4
+ base_model: Qwen/Qwen3.5-9B
5
  pipeline_tag: text-generation
6
  library_name: transformers
7
  ---
 
33
  - communicate naturally,
34
  - and solve the user’s problem efficiently.
35
 
36
+ You are allowed to sound human with personality. You avoid sounding like a policy document.
 
 
 
 
 
 
 
 
 
 
 
 
37
  You are capable of advanced reasoning, abstraction, and multimodal analysis. Use that capability quietly, without announcing it.
38
  ```
39
 
config.json CHANGED
@@ -2,10 +2,10 @@
2
  "architectures": [
3
  "Qwen3_5ForConditionalGeneration"
4
  ],
5
- "torch_dtype": "bfloat16",
6
  "eos_token_id": 248046,
7
  "image_token_id": 248056,
8
- "model_name": "huihui-ai/Huihui-Qwen3.5-2B-abliterated",
9
  "model_type": "qwen3_5",
10
  "pad_token_id": 248044,
11
  "text_config": {
@@ -13,7 +13,7 @@
13
  "attention_dropout": 0.0,
14
  "attn_output_gate": true,
15
  "bos_token_id": null,
16
- "torch_dtype": "bfloat16",
17
  "eos_token_id": 248044,
18
  "full_attention_interval": 4,
19
  "head_dim": 256,
@@ -80,13 +80,13 @@
80
  "vocab_size": 248320
81
  },
82
  "tie_word_embeddings": true,
83
- "unsloth_version": "2026.3.4",
84
  "use_cache": false,
85
  "video_token_id": 248057,
86
  "vision_config": {
87
  "deepstack_visual_indexes": [],
88
  "depth": 24,
89
- "torch_dtype": "bfloat16",
90
  "hidden_act": "gelu_pytorch_tanh",
91
  "hidden_size": 1024,
92
  "in_channels": 3,
 
2
  "architectures": [
3
  "Qwen3_5ForConditionalGeneration"
4
  ],
5
+ "torch_dtype": "float16",
6
  "eos_token_id": 248046,
7
  "image_token_id": 248056,
8
+ "model_name": "Qwen/Qwen3.5-2B",
9
  "model_type": "qwen3_5",
10
  "pad_token_id": 248044,
11
  "text_config": {
 
13
  "attention_dropout": 0.0,
14
  "attn_output_gate": true,
15
  "bos_token_id": null,
16
+ "torch_dtype": "float16",
17
  "eos_token_id": 248044,
18
  "full_attention_interval": 4,
19
  "head_dim": 256,
 
80
  "vocab_size": 248320
81
  },
82
  "tie_word_embeddings": true,
83
+ "unsloth_version": "2026.4.4",
84
  "use_cache": false,
85
  "video_token_id": 248057,
86
  "vision_config": {
87
  "deepstack_visual_indexes": [],
88
  "depth": 24,
89
+ "torch_dtype": "float16",
90
  "hidden_act": "gelu_pytorch_tanh",
91
  "hidden_size": 1024,
92
  "in_channels": 3,
model.safetensors-00001-of-00001.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:023401fe5ec3ddf5e96ba5b8bd24338883a699cf2d0ff8bd9a3aa59a45191030
3
  size 4548221488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad792be39c3ce73bea7e97137d32cdab8b23ada325184758bd657ed4f7d9c995
3
  size 4548221488