Image-Text-to-Text
Transformers
Safetensors
Telugu
gemma4
gemma
telugu
medical
grpo
merged
healthcare
conversational
Instructions to use RohithMidigudla/aarogya_gemma_telugu_medical with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use RohithMidigudla/aarogya_gemma_telugu_medical with Transformers:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("image-text-to-text", model="RohithMidigudla/aarogya_gemma_telugu_medical")
messages = [
    {
        "role": "user",
        "content": [
            {"type": "image", "url": "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/p-blog/candy.JPG"},
            {"type": "text", "text": "What animal is on the candy?"}
        ]
    },
]
pipe(text=messages)

# Load model directly
from transformers import AutoProcessor, AutoModelForMultimodalLM

processor = AutoProcessor.from_pretrained("RohithMidigudla/aarogya_gemma_telugu_medical")
model = AutoModelForMultimodalLM.from_pretrained("RohithMidigudla/aarogya_gemma_telugu_medical")
messages = [
    {
        "role": "user",
        "content": [
            {"type": "image", "url": "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/p-blog/candy.JPG"},
            {"type": "text", "text": "What animal is on the candy?"}
        ]
    },
]
inputs = processor.apply_chat_template(
    messages,
    add_generation_prompt=True,
    tokenize=True,
    return_dict=True,
    return_tensors="pt",
).to(model.device)
outputs = model.generate(**inputs, max_new_tokens=40)
print(processor.decode(outputs[0][inputs["input_ids"].shape[-1]:]))
- Notebooks
- Google Colab
- Kaggle
- Local Apps Settings
- vLLM
How to use RohithMidigudla/aarogya_gemma_telugu_medical with vLLM:
Install from pip and serve model
# Install vLLM from pip:
pip install vllm

# Start the vLLM server:
vllm serve "RohithMidigudla/aarogya_gemma_telugu_medical"

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/chat/completions" \
    -H "Content-Type: application/json" \
    --data '{
        "model": "RohithMidigudla/aarogya_gemma_telugu_medical",
        "messages": [
            {
                "role": "user",
                "content": [
                    {
                        "type": "text",
                        "text": "Describe this image in one sentence."
                    },
                    {
                        "type": "image_url",
                        "image_url": {
                            "url": "https://cdn.britannica.com/61/93061-050-99147DCE/Statue-of-Liberty-Island-New-York-Bay.jpg"
                        }
                    }
                ]
            }
        ]
    }'
Use Docker
docker model run hf.co/RohithMidigudla/aarogya_gemma_telugu_medical
- SGLang
How to use RohithMidigudla/aarogya_gemma_telugu_medical with SGLang:
Install from pip and serve model
# Install SGLang from pip:
pip install sglang

# Start the SGLang server:
python3 -m sglang.launch_server \
    --model-path "RohithMidigudla/aarogya_gemma_telugu_medical" \
    --host 0.0.0.0 \
    --port 30000

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
    -H "Content-Type: application/json" \
    --data '{
        "model": "RohithMidigudla/aarogya_gemma_telugu_medical",
        "messages": [
            {
                "role": "user",
                "content": [
                    {
                        "type": "text",
                        "text": "Describe this image in one sentence."
                    },
                    {
                        "type": "image_url",
                        "image_url": {
                            "url": "https://cdn.britannica.com/61/93061-050-99147DCE/Statue-of-Liberty-Island-New-York-Bay.jpg"
                        }
                    }
                ]
            }
        ]
    }'
Use Docker images
docker run --gpus all \
    --shm-size 32g \
    -p 30000:30000 \
    -v ~/.cache/huggingface:/root/.cache/huggingface \
    --env "HF_TOKEN=<secret>" \
    --ipc=host \
    lmsysorg/sglang:latest \
    python3 -m sglang.launch_server \
        --model-path "RohithMidigudla/aarogya_gemma_telugu_medical" \
        --host 0.0.0.0 \
        --port 30000

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/chat/completions" \
    -H "Content-Type: application/json" \
    --data '{
        "model": "RohithMidigudla/aarogya_gemma_telugu_medical",
        "messages": [
            {
                "role": "user",
                "content": [
                    {
                        "type": "text",
                        "text": "Describe this image in one sentence."
                    },
                    {
                        "type": "image_url",
                        "image_url": {
                            "url": "https://cdn.britannica.com/61/93061-050-99147DCE/Statue-of-Liberty-Island-New-York-Bay.jpg"
                        }
                    }
                ]
            }
        ]
    }'
- Docker Model Runner
How to use RohithMidigudla/aarogya_gemma_telugu_medical with Docker Model Runner:
docker model run hf.co/RohithMidigudla/aarogya_gemma_telugu_medical
Add files using upload-large-folder tool
Browse files
model-missing-base.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2034aab30f47d55d7ec21f597273124453f9cb152690b0d504e77ca28ce3266
|
| 3 |
+
size 110118080
|
model.safetensors.index.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
"total_parameters": 7941100832,
|
| 4 |
-
"total_size":
|
| 5 |
},
|
| 6 |
"weight_map": {
|
| 7 |
"model.audio_tower.layers.0.feed_forward1.ffw_layer_1.input_max": "model-00002-of-00004.safetensors",
|
|
@@ -1059,9 +1059,12 @@
|
|
| 1059 |
"model.language_model.layers.24.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1060 |
"model.language_model.layers.24.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1061 |
"model.language_model.layers.24.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1062 |
"model.language_model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1063 |
"model.language_model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1064 |
"model.language_model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1065 |
"model.language_model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1066 |
"model.language_model.layers.25.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1067 |
"model.language_model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1073,9 +1076,12 @@
|
|
| 1073 |
"model.language_model.layers.25.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1074 |
"model.language_model.layers.25.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1075 |
"model.language_model.layers.25.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1076 |
"model.language_model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1077 |
"model.language_model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1078 |
"model.language_model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1079 |
"model.language_model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1080 |
"model.language_model.layers.26.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1081 |
"model.language_model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1087,9 +1093,12 @@
|
|
| 1087 |
"model.language_model.layers.26.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1088 |
"model.language_model.layers.26.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1089 |
"model.language_model.layers.26.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1090 |
"model.language_model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1091 |
"model.language_model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1092 |
"model.language_model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1093 |
"model.language_model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1094 |
"model.language_model.layers.27.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1095 |
"model.language_model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1101,9 +1110,12 @@
|
|
| 1101 |
"model.language_model.layers.27.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1102 |
"model.language_model.layers.27.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1103 |
"model.language_model.layers.27.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1104 |
"model.language_model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1105 |
"model.language_model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1106 |
"model.language_model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1107 |
"model.language_model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1108 |
"model.language_model.layers.28.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1109 |
"model.language_model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1115,9 +1127,12 @@
|
|
| 1115 |
"model.language_model.layers.28.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1116 |
"model.language_model.layers.28.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1117 |
"model.language_model.layers.28.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1118 |
"model.language_model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1119 |
"model.language_model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1120 |
"model.language_model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1121 |
"model.language_model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1122 |
"model.language_model.layers.29.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1123 |
"model.language_model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1129,9 +1144,12 @@
|
|
| 1129 |
"model.language_model.layers.29.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1130 |
"model.language_model.layers.29.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1131 |
"model.language_model.layers.29.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1132 |
"model.language_model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1133 |
"model.language_model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1134 |
"model.language_model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1135 |
"model.language_model.layers.3.input_layernorm.weight": "model-00002-of-00004.safetensors",
|
| 1136 |
"model.language_model.layers.3.layer_scalar": "model-00002-of-00004.safetensors",
|
| 1137 |
"model.language_model.layers.3.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
|
|
@@ -1160,9 +1178,12 @@
|
|
| 1160 |
"model.language_model.layers.30.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1161 |
"model.language_model.layers.30.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1162 |
"model.language_model.layers.30.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1163 |
"model.language_model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1164 |
"model.language_model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1165 |
"model.language_model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1166 |
"model.language_model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1167 |
"model.language_model.layers.31.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1168 |
"model.language_model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1174,9 +1195,12 @@
|
|
| 1174 |
"model.language_model.layers.31.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1175 |
"model.language_model.layers.31.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1176 |
"model.language_model.layers.31.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1177 |
"model.language_model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1178 |
"model.language_model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1179 |
"model.language_model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1180 |
"model.language_model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1181 |
"model.language_model.layers.32.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1182 |
"model.language_model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1188,9 +1212,12 @@
|
|
| 1188 |
"model.language_model.layers.32.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1189 |
"model.language_model.layers.32.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1190 |
"model.language_model.layers.32.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1191 |
"model.language_model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1192 |
"model.language_model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1193 |
"model.language_model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1194 |
"model.language_model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1195 |
"model.language_model.layers.33.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1196 |
"model.language_model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1202,9 +1229,12 @@
|
|
| 1202 |
"model.language_model.layers.33.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1203 |
"model.language_model.layers.33.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1204 |
"model.language_model.layers.33.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1205 |
"model.language_model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1206 |
"model.language_model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1207 |
"model.language_model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1208 |
"model.language_model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1209 |
"model.language_model.layers.34.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1210 |
"model.language_model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1216,9 +1246,12 @@
|
|
| 1216 |
"model.language_model.layers.34.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1217 |
"model.language_model.layers.34.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1218 |
"model.language_model.layers.34.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1219 |
"model.language_model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1220 |
"model.language_model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1221 |
"model.language_model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1222 |
"model.language_model.layers.35.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1223 |
"model.language_model.layers.35.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1224 |
"model.language_model.layers.35.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1230,9 +1263,12 @@
|
|
| 1230 |
"model.language_model.layers.35.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1231 |
"model.language_model.layers.35.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1232 |
"model.language_model.layers.35.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1233 |
"model.language_model.layers.35.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1234 |
"model.language_model.layers.35.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1235 |
"model.language_model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1236 |
"model.language_model.layers.36.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1237 |
"model.language_model.layers.36.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1238 |
"model.language_model.layers.36.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1244,9 +1280,12 @@
|
|
| 1244 |
"model.language_model.layers.36.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1245 |
"model.language_model.layers.36.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1246 |
"model.language_model.layers.36.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1247 |
"model.language_model.layers.36.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1248 |
"model.language_model.layers.36.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1249 |
"model.language_model.layers.36.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1250 |
"model.language_model.layers.37.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1251 |
"model.language_model.layers.37.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1252 |
"model.language_model.layers.37.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1258,9 +1297,12 @@
|
|
| 1258 |
"model.language_model.layers.37.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1259 |
"model.language_model.layers.37.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1260 |
"model.language_model.layers.37.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1261 |
"model.language_model.layers.37.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1262 |
"model.language_model.layers.37.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1263 |
"model.language_model.layers.37.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1264 |
"model.language_model.layers.38.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1265 |
"model.language_model.layers.38.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1266 |
"model.language_model.layers.38.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1272,9 +1314,12 @@
|
|
| 1272 |
"model.language_model.layers.38.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1273 |
"model.language_model.layers.38.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1274 |
"model.language_model.layers.38.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1275 |
"model.language_model.layers.38.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1276 |
"model.language_model.layers.38.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1277 |
"model.language_model.layers.38.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1278 |
"model.language_model.layers.39.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1279 |
"model.language_model.layers.39.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1280 |
"model.language_model.layers.39.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1286,9 +1331,12 @@
|
|
| 1286 |
"model.language_model.layers.39.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1287 |
"model.language_model.layers.39.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1288 |
"model.language_model.layers.39.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1289 |
"model.language_model.layers.39.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1290 |
"model.language_model.layers.39.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1291 |
"model.language_model.layers.39.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1292 |
"model.language_model.layers.4.input_layernorm.weight": "model-00002-of-00004.safetensors",
|
| 1293 |
"model.language_model.layers.4.layer_scalar": "model-00002-of-00004.safetensors",
|
| 1294 |
"model.language_model.layers.4.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
|
|
@@ -1317,9 +1365,12 @@
|
|
| 1317 |
"model.language_model.layers.40.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1318 |
"model.language_model.layers.40.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1319 |
"model.language_model.layers.40.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1320 |
"model.language_model.layers.40.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1321 |
"model.language_model.layers.40.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1322 |
"model.language_model.layers.40.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1323 |
"model.language_model.layers.41.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1324 |
"model.language_model.layers.41.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1325 |
"model.language_model.layers.41.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
@@ -1331,9 +1382,12 @@
|
|
| 1331 |
"model.language_model.layers.41.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1332 |
"model.language_model.layers.41.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1333 |
"model.language_model.layers.41.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
|
|
|
|
|
|
| 1334 |
"model.language_model.layers.41.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1335 |
"model.language_model.layers.41.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1336 |
"model.language_model.layers.41.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1337 |
"model.language_model.layers.5.input_layernorm.weight": "model-00002-of-00004.safetensors",
|
| 1338 |
"model.language_model.layers.5.layer_scalar": "model-00002-of-00004.safetensors",
|
| 1339 |
"model.language_model.layers.5.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
"total_parameters": 7941100832,
|
| 4 |
+
"total_size": 15992314836
|
| 5 |
},
|
| 6 |
"weight_map": {
|
| 7 |
"model.audio_tower.layers.0.feed_forward1.ffw_layer_1.input_max": "model-00002-of-00004.safetensors",
|
|
|
|
| 1059 |
"model.language_model.layers.24.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1060 |
"model.language_model.layers.24.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1061 |
"model.language_model.layers.24.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1062 |
+
"model.language_model.layers.24.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1063 |
+
"model.language_model.layers.24.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1064 |
"model.language_model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1065 |
"model.language_model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1066 |
"model.language_model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1067 |
+
"model.language_model.layers.24.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1068 |
"model.language_model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1069 |
"model.language_model.layers.25.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1070 |
"model.language_model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1076 |
"model.language_model.layers.25.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1077 |
"model.language_model.layers.25.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1078 |
"model.language_model.layers.25.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1079 |
+
"model.language_model.layers.25.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1080 |
+
"model.language_model.layers.25.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1081 |
"model.language_model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1082 |
"model.language_model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1083 |
"model.language_model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1084 |
+
"model.language_model.layers.25.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1085 |
"model.language_model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1086 |
"model.language_model.layers.26.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1087 |
"model.language_model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1093 |
"model.language_model.layers.26.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1094 |
"model.language_model.layers.26.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1095 |
"model.language_model.layers.26.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1096 |
+
"model.language_model.layers.26.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1097 |
+
"model.language_model.layers.26.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1098 |
"model.language_model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1099 |
"model.language_model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1100 |
"model.language_model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1101 |
+
"model.language_model.layers.26.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1102 |
"model.language_model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1103 |
"model.language_model.layers.27.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1104 |
"model.language_model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1110 |
"model.language_model.layers.27.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1111 |
"model.language_model.layers.27.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1112 |
"model.language_model.layers.27.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1113 |
+
"model.language_model.layers.27.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1114 |
+
"model.language_model.layers.27.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1115 |
"model.language_model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1116 |
"model.language_model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1117 |
"model.language_model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1118 |
+
"model.language_model.layers.27.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1119 |
"model.language_model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1120 |
"model.language_model.layers.28.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1121 |
"model.language_model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1127 |
"model.language_model.layers.28.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1128 |
"model.language_model.layers.28.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1129 |
"model.language_model.layers.28.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1130 |
+
"model.language_model.layers.28.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1131 |
+
"model.language_model.layers.28.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1132 |
"model.language_model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1133 |
"model.language_model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1134 |
"model.language_model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1135 |
+
"model.language_model.layers.28.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1136 |
"model.language_model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1137 |
"model.language_model.layers.29.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1138 |
"model.language_model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1144 |
"model.language_model.layers.29.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1145 |
"model.language_model.layers.29.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1146 |
"model.language_model.layers.29.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1147 |
+
"model.language_model.layers.29.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1148 |
+
"model.language_model.layers.29.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1149 |
"model.language_model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1150 |
"model.language_model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1151 |
"model.language_model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1152 |
+
"model.language_model.layers.29.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1153 |
"model.language_model.layers.3.input_layernorm.weight": "model-00002-of-00004.safetensors",
|
| 1154 |
"model.language_model.layers.3.layer_scalar": "model-00002-of-00004.safetensors",
|
| 1155 |
"model.language_model.layers.3.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
|
|
|
|
| 1178 |
"model.language_model.layers.30.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1179 |
"model.language_model.layers.30.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1180 |
"model.language_model.layers.30.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1181 |
+
"model.language_model.layers.30.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1182 |
+
"model.language_model.layers.30.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1183 |
"model.language_model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1184 |
"model.language_model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1185 |
"model.language_model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1186 |
+
"model.language_model.layers.30.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1187 |
"model.language_model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1188 |
"model.language_model.layers.31.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1189 |
"model.language_model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1195 |
"model.language_model.layers.31.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1196 |
"model.language_model.layers.31.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1197 |
"model.language_model.layers.31.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1198 |
+
"model.language_model.layers.31.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1199 |
+
"model.language_model.layers.31.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1200 |
"model.language_model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1201 |
"model.language_model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1202 |
"model.language_model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1203 |
+
"model.language_model.layers.31.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1204 |
"model.language_model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1205 |
"model.language_model.layers.32.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1206 |
"model.language_model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1212 |
"model.language_model.layers.32.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1213 |
"model.language_model.layers.32.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1214 |
"model.language_model.layers.32.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1215 |
+
"model.language_model.layers.32.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1216 |
+
"model.language_model.layers.32.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1217 |
"model.language_model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1218 |
"model.language_model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1219 |
"model.language_model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1220 |
+
"model.language_model.layers.32.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1221 |
"model.language_model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1222 |
"model.language_model.layers.33.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1223 |
"model.language_model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1229 |
"model.language_model.layers.33.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1230 |
"model.language_model.layers.33.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1231 |
"model.language_model.layers.33.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1232 |
+
"model.language_model.layers.33.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1233 |
+
"model.language_model.layers.33.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1234 |
"model.language_model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1235 |
"model.language_model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1236 |
"model.language_model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1237 |
+
"model.language_model.layers.33.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1238 |
"model.language_model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1239 |
"model.language_model.layers.34.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1240 |
"model.language_model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1246 |
"model.language_model.layers.34.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1247 |
"model.language_model.layers.34.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1248 |
"model.language_model.layers.34.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1249 |
+
"model.language_model.layers.34.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1250 |
+
"model.language_model.layers.34.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1251 |
"model.language_model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1252 |
"model.language_model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1253 |
"model.language_model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1254 |
+
"model.language_model.layers.34.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1255 |
"model.language_model.layers.35.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1256 |
"model.language_model.layers.35.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1257 |
"model.language_model.layers.35.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1263 |
"model.language_model.layers.35.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1264 |
"model.language_model.layers.35.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1265 |
"model.language_model.layers.35.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1266 |
+
"model.language_model.layers.35.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1267 |
+
"model.language_model.layers.35.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1268 |
"model.language_model.layers.35.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1269 |
"model.language_model.layers.35.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1270 |
"model.language_model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1271 |
+
"model.language_model.layers.35.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1272 |
"model.language_model.layers.36.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1273 |
"model.language_model.layers.36.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1274 |
"model.language_model.layers.36.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1280 |
"model.language_model.layers.36.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1281 |
"model.language_model.layers.36.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1282 |
"model.language_model.layers.36.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1283 |
+
"model.language_model.layers.36.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1284 |
+
"model.language_model.layers.36.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1285 |
"model.language_model.layers.36.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1286 |
"model.language_model.layers.36.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1287 |
"model.language_model.layers.36.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1288 |
+
"model.language_model.layers.36.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1289 |
"model.language_model.layers.37.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1290 |
"model.language_model.layers.37.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1291 |
"model.language_model.layers.37.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1297 |
"model.language_model.layers.37.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1298 |
"model.language_model.layers.37.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1299 |
"model.language_model.layers.37.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1300 |
+
"model.language_model.layers.37.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1301 |
+
"model.language_model.layers.37.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1302 |
"model.language_model.layers.37.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1303 |
"model.language_model.layers.37.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1304 |
"model.language_model.layers.37.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1305 |
+
"model.language_model.layers.37.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1306 |
"model.language_model.layers.38.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1307 |
"model.language_model.layers.38.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1308 |
"model.language_model.layers.38.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1314 |
"model.language_model.layers.38.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1315 |
"model.language_model.layers.38.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1316 |
"model.language_model.layers.38.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1317 |
+
"model.language_model.layers.38.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1318 |
+
"model.language_model.layers.38.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1319 |
"model.language_model.layers.38.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1320 |
"model.language_model.layers.38.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1321 |
"model.language_model.layers.38.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1322 |
+
"model.language_model.layers.38.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1323 |
"model.language_model.layers.39.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1324 |
"model.language_model.layers.39.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1325 |
"model.language_model.layers.39.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1331 |
"model.language_model.layers.39.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1332 |
"model.language_model.layers.39.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1333 |
"model.language_model.layers.39.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1334 |
+
"model.language_model.layers.39.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1335 |
+
"model.language_model.layers.39.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1336 |
"model.language_model.layers.39.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1337 |
"model.language_model.layers.39.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1338 |
"model.language_model.layers.39.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1339 |
+
"model.language_model.layers.39.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1340 |
"model.language_model.layers.4.input_layernorm.weight": "model-00002-of-00004.safetensors",
|
| 1341 |
"model.language_model.layers.4.layer_scalar": "model-00002-of-00004.safetensors",
|
| 1342 |
"model.language_model.layers.4.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
|
|
|
|
| 1365 |
"model.language_model.layers.40.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1366 |
"model.language_model.layers.40.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1367 |
"model.language_model.layers.40.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1368 |
+
"model.language_model.layers.40.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1369 |
+
"model.language_model.layers.40.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1370 |
"model.language_model.layers.40.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1371 |
"model.language_model.layers.40.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1372 |
"model.language_model.layers.40.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1373 |
+
"model.language_model.layers.40.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1374 |
"model.language_model.layers.41.input_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1375 |
"model.language_model.layers.41.layer_scalar": "model-00003-of-00004.safetensors",
|
| 1376 |
"model.language_model.layers.41.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
|
|
|
|
| 1382 |
"model.language_model.layers.41.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1383 |
"model.language_model.layers.41.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
|
| 1384 |
"model.language_model.layers.41.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
|
| 1385 |
+
"model.language_model.layers.41.self_attn.k_norm.weight": "model-missing-base.safetensors",
|
| 1386 |
+
"model.language_model.layers.41.self_attn.k_proj.weight": "model-missing-base.safetensors",
|
| 1387 |
"model.language_model.layers.41.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
|
| 1388 |
"model.language_model.layers.41.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
|
| 1389 |
"model.language_model.layers.41.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
|
| 1390 |
+
"model.language_model.layers.41.self_attn.v_proj.weight": "model-missing-base.safetensors",
|
| 1391 |
"model.language_model.layers.5.input_layernorm.weight": "model-00002-of-00004.safetensors",
|
| 1392 |
"model.language_model.layers.5.layer_scalar": "model-00002-of-00004.safetensors",
|
| 1393 |
"model.language_model.layers.5.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
|