RohithMidigudla committed on
Commit
52d3c53
·
verified ·
1 Parent(s): 2b97958

Add files using upload-large-folder tool

Browse files
model-missing-base.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2034aab30f47d55d7ec21f597273124453f9cb152690b0d504e77ca28ce3266
3
+ size 110118080
model.safetensors.index.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "metadata": {
3
  "total_parameters": 7941100832,
4
- "total_size": 15882203604
5
  },
6
  "weight_map": {
7
  "model.audio_tower.layers.0.feed_forward1.ffw_layer_1.input_max": "model-00002-of-00004.safetensors",
@@ -1059,9 +1059,12 @@
1059
  "model.language_model.layers.24.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1060
  "model.language_model.layers.24.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1061
  "model.language_model.layers.24.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1062
  "model.language_model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1063
  "model.language_model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1064
  "model.language_model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1065
  "model.language_model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors",
1066
  "model.language_model.layers.25.layer_scalar": "model-00003-of-00004.safetensors",
1067
  "model.language_model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1073,9 +1076,12 @@
1073
  "model.language_model.layers.25.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1074
  "model.language_model.layers.25.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1075
  "model.language_model.layers.25.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1076
  "model.language_model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1077
  "model.language_model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1078
  "model.language_model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1079
  "model.language_model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors",
1080
  "model.language_model.layers.26.layer_scalar": "model-00003-of-00004.safetensors",
1081
  "model.language_model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1087,9 +1093,12 @@
1087
  "model.language_model.layers.26.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1088
  "model.language_model.layers.26.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1089
  "model.language_model.layers.26.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1090
  "model.language_model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1091
  "model.language_model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1092
  "model.language_model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1093
  "model.language_model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors",
1094
  "model.language_model.layers.27.layer_scalar": "model-00003-of-00004.safetensors",
1095
  "model.language_model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1101,9 +1110,12 @@
1101
  "model.language_model.layers.27.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1102
  "model.language_model.layers.27.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1103
  "model.language_model.layers.27.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1104
  "model.language_model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1105
  "model.language_model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1106
  "model.language_model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1107
  "model.language_model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors",
1108
  "model.language_model.layers.28.layer_scalar": "model-00003-of-00004.safetensors",
1109
  "model.language_model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1115,9 +1127,12 @@
1115
  "model.language_model.layers.28.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1116
  "model.language_model.layers.28.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1117
  "model.language_model.layers.28.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1118
  "model.language_model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1119
  "model.language_model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1120
  "model.language_model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1121
  "model.language_model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors",
1122
  "model.language_model.layers.29.layer_scalar": "model-00003-of-00004.safetensors",
1123
  "model.language_model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1129,9 +1144,12 @@
1129
  "model.language_model.layers.29.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1130
  "model.language_model.layers.29.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1131
  "model.language_model.layers.29.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1132
  "model.language_model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1133
  "model.language_model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1134
  "model.language_model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1135
  "model.language_model.layers.3.input_layernorm.weight": "model-00002-of-00004.safetensors",
1136
  "model.language_model.layers.3.layer_scalar": "model-00002-of-00004.safetensors",
1137
  "model.language_model.layers.3.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
@@ -1160,9 +1178,12 @@
1160
  "model.language_model.layers.30.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1161
  "model.language_model.layers.30.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1162
  "model.language_model.layers.30.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1163
  "model.language_model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1164
  "model.language_model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1165
  "model.language_model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1166
  "model.language_model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors",
1167
  "model.language_model.layers.31.layer_scalar": "model-00003-of-00004.safetensors",
1168
  "model.language_model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1174,9 +1195,12 @@
1174
  "model.language_model.layers.31.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1175
  "model.language_model.layers.31.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1176
  "model.language_model.layers.31.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1177
  "model.language_model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1178
  "model.language_model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1179
  "model.language_model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1180
  "model.language_model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors",
1181
  "model.language_model.layers.32.layer_scalar": "model-00003-of-00004.safetensors",
1182
  "model.language_model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1188,9 +1212,12 @@
1188
  "model.language_model.layers.32.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1189
  "model.language_model.layers.32.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1190
  "model.language_model.layers.32.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1191
  "model.language_model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1192
  "model.language_model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1193
  "model.language_model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1194
  "model.language_model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors",
1195
  "model.language_model.layers.33.layer_scalar": "model-00003-of-00004.safetensors",
1196
  "model.language_model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1202,9 +1229,12 @@
1202
  "model.language_model.layers.33.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1203
  "model.language_model.layers.33.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1204
  "model.language_model.layers.33.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1205
  "model.language_model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1206
  "model.language_model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1207
  "model.language_model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1208
  "model.language_model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors",
1209
  "model.language_model.layers.34.layer_scalar": "model-00003-of-00004.safetensors",
1210
  "model.language_model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1216,9 +1246,12 @@
1216
  "model.language_model.layers.34.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1217
  "model.language_model.layers.34.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1218
  "model.language_model.layers.34.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1219
  "model.language_model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1220
  "model.language_model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1221
  "model.language_model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1222
  "model.language_model.layers.35.input_layernorm.weight": "model-00003-of-00004.safetensors",
1223
  "model.language_model.layers.35.layer_scalar": "model-00003-of-00004.safetensors",
1224
  "model.language_model.layers.35.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1230,9 +1263,12 @@
1230
  "model.language_model.layers.35.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1231
  "model.language_model.layers.35.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1232
  "model.language_model.layers.35.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1233
  "model.language_model.layers.35.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1234
  "model.language_model.layers.35.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1235
  "model.language_model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1236
  "model.language_model.layers.36.input_layernorm.weight": "model-00003-of-00004.safetensors",
1237
  "model.language_model.layers.36.layer_scalar": "model-00003-of-00004.safetensors",
1238
  "model.language_model.layers.36.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1244,9 +1280,12 @@
1244
  "model.language_model.layers.36.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1245
  "model.language_model.layers.36.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1246
  "model.language_model.layers.36.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1247
  "model.language_model.layers.36.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1248
  "model.language_model.layers.36.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1249
  "model.language_model.layers.36.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1250
  "model.language_model.layers.37.input_layernorm.weight": "model-00003-of-00004.safetensors",
1251
  "model.language_model.layers.37.layer_scalar": "model-00003-of-00004.safetensors",
1252
  "model.language_model.layers.37.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1258,9 +1297,12 @@
1258
  "model.language_model.layers.37.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1259
  "model.language_model.layers.37.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1260
  "model.language_model.layers.37.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1261
  "model.language_model.layers.37.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1262
  "model.language_model.layers.37.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1263
  "model.language_model.layers.37.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1264
  "model.language_model.layers.38.input_layernorm.weight": "model-00003-of-00004.safetensors",
1265
  "model.language_model.layers.38.layer_scalar": "model-00003-of-00004.safetensors",
1266
  "model.language_model.layers.38.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1272,9 +1314,12 @@
1272
  "model.language_model.layers.38.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1273
  "model.language_model.layers.38.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1274
  "model.language_model.layers.38.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1275
  "model.language_model.layers.38.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1276
  "model.language_model.layers.38.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1277
  "model.language_model.layers.38.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1278
  "model.language_model.layers.39.input_layernorm.weight": "model-00003-of-00004.safetensors",
1279
  "model.language_model.layers.39.layer_scalar": "model-00003-of-00004.safetensors",
1280
  "model.language_model.layers.39.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1286,9 +1331,12 @@
1286
  "model.language_model.layers.39.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1287
  "model.language_model.layers.39.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1288
  "model.language_model.layers.39.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1289
  "model.language_model.layers.39.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1290
  "model.language_model.layers.39.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1291
  "model.language_model.layers.39.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1292
  "model.language_model.layers.4.input_layernorm.weight": "model-00002-of-00004.safetensors",
1293
  "model.language_model.layers.4.layer_scalar": "model-00002-of-00004.safetensors",
1294
  "model.language_model.layers.4.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
@@ -1317,9 +1365,12 @@
1317
  "model.language_model.layers.40.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1318
  "model.language_model.layers.40.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1319
  "model.language_model.layers.40.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1320
  "model.language_model.layers.40.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1321
  "model.language_model.layers.40.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1322
  "model.language_model.layers.40.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1323
  "model.language_model.layers.41.input_layernorm.weight": "model-00003-of-00004.safetensors",
1324
  "model.language_model.layers.41.layer_scalar": "model-00003-of-00004.safetensors",
1325
  "model.language_model.layers.41.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
@@ -1331,9 +1382,12 @@
1331
  "model.language_model.layers.41.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1332
  "model.language_model.layers.41.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1333
  "model.language_model.layers.41.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
 
 
1334
  "model.language_model.layers.41.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1335
  "model.language_model.layers.41.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1336
  "model.language_model.layers.41.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
 
1337
  "model.language_model.layers.5.input_layernorm.weight": "model-00002-of-00004.safetensors",
1338
  "model.language_model.layers.5.layer_scalar": "model-00002-of-00004.safetensors",
1339
  "model.language_model.layers.5.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
 
1
  {
2
  "metadata": {
3
  "total_parameters": 7941100832,
4
+ "total_size": 15992314836
5
  },
6
  "weight_map": {
7
  "model.audio_tower.layers.0.feed_forward1.ffw_layer_1.input_max": "model-00002-of-00004.safetensors",
 
1059
  "model.language_model.layers.24.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1060
  "model.language_model.layers.24.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1061
  "model.language_model.layers.24.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1062
+ "model.language_model.layers.24.self_attn.k_norm.weight": "model-missing-base.safetensors",
1063
+ "model.language_model.layers.24.self_attn.k_proj.weight": "model-missing-base.safetensors",
1064
  "model.language_model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1065
  "model.language_model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1066
  "model.language_model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1067
+ "model.language_model.layers.24.self_attn.v_proj.weight": "model-missing-base.safetensors",
1068
  "model.language_model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors",
1069
  "model.language_model.layers.25.layer_scalar": "model-00003-of-00004.safetensors",
1070
  "model.language_model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1076
  "model.language_model.layers.25.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1077
  "model.language_model.layers.25.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1078
  "model.language_model.layers.25.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1079
+ "model.language_model.layers.25.self_attn.k_norm.weight": "model-missing-base.safetensors",
1080
+ "model.language_model.layers.25.self_attn.k_proj.weight": "model-missing-base.safetensors",
1081
  "model.language_model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1082
  "model.language_model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1083
  "model.language_model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1084
+ "model.language_model.layers.25.self_attn.v_proj.weight": "model-missing-base.safetensors",
1085
  "model.language_model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors",
1086
  "model.language_model.layers.26.layer_scalar": "model-00003-of-00004.safetensors",
1087
  "model.language_model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1093
  "model.language_model.layers.26.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1094
  "model.language_model.layers.26.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1095
  "model.language_model.layers.26.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1096
+ "model.language_model.layers.26.self_attn.k_norm.weight": "model-missing-base.safetensors",
1097
+ "model.language_model.layers.26.self_attn.k_proj.weight": "model-missing-base.safetensors",
1098
  "model.language_model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1099
  "model.language_model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1100
  "model.language_model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1101
+ "model.language_model.layers.26.self_attn.v_proj.weight": "model-missing-base.safetensors",
1102
  "model.language_model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors",
1103
  "model.language_model.layers.27.layer_scalar": "model-00003-of-00004.safetensors",
1104
  "model.language_model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1110
  "model.language_model.layers.27.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1111
  "model.language_model.layers.27.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1112
  "model.language_model.layers.27.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1113
+ "model.language_model.layers.27.self_attn.k_norm.weight": "model-missing-base.safetensors",
1114
+ "model.language_model.layers.27.self_attn.k_proj.weight": "model-missing-base.safetensors",
1115
  "model.language_model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1116
  "model.language_model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1117
  "model.language_model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1118
+ "model.language_model.layers.27.self_attn.v_proj.weight": "model-missing-base.safetensors",
1119
  "model.language_model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors",
1120
  "model.language_model.layers.28.layer_scalar": "model-00003-of-00004.safetensors",
1121
  "model.language_model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1127
  "model.language_model.layers.28.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1128
  "model.language_model.layers.28.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1129
  "model.language_model.layers.28.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1130
+ "model.language_model.layers.28.self_attn.k_norm.weight": "model-missing-base.safetensors",
1131
+ "model.language_model.layers.28.self_attn.k_proj.weight": "model-missing-base.safetensors",
1132
  "model.language_model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1133
  "model.language_model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1134
  "model.language_model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1135
+ "model.language_model.layers.28.self_attn.v_proj.weight": "model-missing-base.safetensors",
1136
  "model.language_model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors",
1137
  "model.language_model.layers.29.layer_scalar": "model-00003-of-00004.safetensors",
1138
  "model.language_model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1144
  "model.language_model.layers.29.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1145
  "model.language_model.layers.29.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1146
  "model.language_model.layers.29.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1147
+ "model.language_model.layers.29.self_attn.k_norm.weight": "model-missing-base.safetensors",
1148
+ "model.language_model.layers.29.self_attn.k_proj.weight": "model-missing-base.safetensors",
1149
  "model.language_model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1150
  "model.language_model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1151
  "model.language_model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1152
+ "model.language_model.layers.29.self_attn.v_proj.weight": "model-missing-base.safetensors",
1153
  "model.language_model.layers.3.input_layernorm.weight": "model-00002-of-00004.safetensors",
1154
  "model.language_model.layers.3.layer_scalar": "model-00002-of-00004.safetensors",
1155
  "model.language_model.layers.3.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
 
1178
  "model.language_model.layers.30.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1179
  "model.language_model.layers.30.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1180
  "model.language_model.layers.30.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1181
+ "model.language_model.layers.30.self_attn.k_norm.weight": "model-missing-base.safetensors",
1182
+ "model.language_model.layers.30.self_attn.k_proj.weight": "model-missing-base.safetensors",
1183
  "model.language_model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1184
  "model.language_model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1185
  "model.language_model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1186
+ "model.language_model.layers.30.self_attn.v_proj.weight": "model-missing-base.safetensors",
1187
  "model.language_model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors",
1188
  "model.language_model.layers.31.layer_scalar": "model-00003-of-00004.safetensors",
1189
  "model.language_model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1195
  "model.language_model.layers.31.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1196
  "model.language_model.layers.31.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1197
  "model.language_model.layers.31.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1198
+ "model.language_model.layers.31.self_attn.k_norm.weight": "model-missing-base.safetensors",
1199
+ "model.language_model.layers.31.self_attn.k_proj.weight": "model-missing-base.safetensors",
1200
  "model.language_model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1201
  "model.language_model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1202
  "model.language_model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1203
+ "model.language_model.layers.31.self_attn.v_proj.weight": "model-missing-base.safetensors",
1204
  "model.language_model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors",
1205
  "model.language_model.layers.32.layer_scalar": "model-00003-of-00004.safetensors",
1206
  "model.language_model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1212
  "model.language_model.layers.32.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1213
  "model.language_model.layers.32.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1214
  "model.language_model.layers.32.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1215
+ "model.language_model.layers.32.self_attn.k_norm.weight": "model-missing-base.safetensors",
1216
+ "model.language_model.layers.32.self_attn.k_proj.weight": "model-missing-base.safetensors",
1217
  "model.language_model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1218
  "model.language_model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1219
  "model.language_model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1220
+ "model.language_model.layers.32.self_attn.v_proj.weight": "model-missing-base.safetensors",
1221
  "model.language_model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors",
1222
  "model.language_model.layers.33.layer_scalar": "model-00003-of-00004.safetensors",
1223
  "model.language_model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1229
  "model.language_model.layers.33.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1230
  "model.language_model.layers.33.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1231
  "model.language_model.layers.33.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1232
+ "model.language_model.layers.33.self_attn.k_norm.weight": "model-missing-base.safetensors",
1233
+ "model.language_model.layers.33.self_attn.k_proj.weight": "model-missing-base.safetensors",
1234
  "model.language_model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1235
  "model.language_model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1236
  "model.language_model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1237
+ "model.language_model.layers.33.self_attn.v_proj.weight": "model-missing-base.safetensors",
1238
  "model.language_model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors",
1239
  "model.language_model.layers.34.layer_scalar": "model-00003-of-00004.safetensors",
1240
  "model.language_model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1246
  "model.language_model.layers.34.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1247
  "model.language_model.layers.34.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1248
  "model.language_model.layers.34.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1249
+ "model.language_model.layers.34.self_attn.k_norm.weight": "model-missing-base.safetensors",
1250
+ "model.language_model.layers.34.self_attn.k_proj.weight": "model-missing-base.safetensors",
1251
  "model.language_model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1252
  "model.language_model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1253
  "model.language_model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1254
+ "model.language_model.layers.34.self_attn.v_proj.weight": "model-missing-base.safetensors",
1255
  "model.language_model.layers.35.input_layernorm.weight": "model-00003-of-00004.safetensors",
1256
  "model.language_model.layers.35.layer_scalar": "model-00003-of-00004.safetensors",
1257
  "model.language_model.layers.35.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1263
  "model.language_model.layers.35.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1264
  "model.language_model.layers.35.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1265
  "model.language_model.layers.35.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1266
+ "model.language_model.layers.35.self_attn.k_norm.weight": "model-missing-base.safetensors",
1267
+ "model.language_model.layers.35.self_attn.k_proj.weight": "model-missing-base.safetensors",
1268
  "model.language_model.layers.35.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1269
  "model.language_model.layers.35.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1270
  "model.language_model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1271
+ "model.language_model.layers.35.self_attn.v_proj.weight": "model-missing-base.safetensors",
1272
  "model.language_model.layers.36.input_layernorm.weight": "model-00003-of-00004.safetensors",
1273
  "model.language_model.layers.36.layer_scalar": "model-00003-of-00004.safetensors",
1274
  "model.language_model.layers.36.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1280
  "model.language_model.layers.36.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1281
  "model.language_model.layers.36.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1282
  "model.language_model.layers.36.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1283
+ "model.language_model.layers.36.self_attn.k_norm.weight": "model-missing-base.safetensors",
1284
+ "model.language_model.layers.36.self_attn.k_proj.weight": "model-missing-base.safetensors",
1285
  "model.language_model.layers.36.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1286
  "model.language_model.layers.36.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1287
  "model.language_model.layers.36.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1288
+ "model.language_model.layers.36.self_attn.v_proj.weight": "model-missing-base.safetensors",
1289
  "model.language_model.layers.37.input_layernorm.weight": "model-00003-of-00004.safetensors",
1290
  "model.language_model.layers.37.layer_scalar": "model-00003-of-00004.safetensors",
1291
  "model.language_model.layers.37.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1297
  "model.language_model.layers.37.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1298
  "model.language_model.layers.37.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1299
  "model.language_model.layers.37.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1300
+ "model.language_model.layers.37.self_attn.k_norm.weight": "model-missing-base.safetensors",
1301
+ "model.language_model.layers.37.self_attn.k_proj.weight": "model-missing-base.safetensors",
1302
  "model.language_model.layers.37.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1303
  "model.language_model.layers.37.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1304
  "model.language_model.layers.37.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1305
+ "model.language_model.layers.37.self_attn.v_proj.weight": "model-missing-base.safetensors",
1306
  "model.language_model.layers.38.input_layernorm.weight": "model-00003-of-00004.safetensors",
1307
  "model.language_model.layers.38.layer_scalar": "model-00003-of-00004.safetensors",
1308
  "model.language_model.layers.38.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1314
  "model.language_model.layers.38.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1315
  "model.language_model.layers.38.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1316
  "model.language_model.layers.38.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1317
+ "model.language_model.layers.38.self_attn.k_norm.weight": "model-missing-base.safetensors",
1318
+ "model.language_model.layers.38.self_attn.k_proj.weight": "model-missing-base.safetensors",
1319
  "model.language_model.layers.38.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1320
  "model.language_model.layers.38.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1321
  "model.language_model.layers.38.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1322
+ "model.language_model.layers.38.self_attn.v_proj.weight": "model-missing-base.safetensors",
1323
  "model.language_model.layers.39.input_layernorm.weight": "model-00003-of-00004.safetensors",
1324
  "model.language_model.layers.39.layer_scalar": "model-00003-of-00004.safetensors",
1325
  "model.language_model.layers.39.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1331
  "model.language_model.layers.39.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1332
  "model.language_model.layers.39.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1333
  "model.language_model.layers.39.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1334
+ "model.language_model.layers.39.self_attn.k_norm.weight": "model-missing-base.safetensors",
1335
+ "model.language_model.layers.39.self_attn.k_proj.weight": "model-missing-base.safetensors",
1336
  "model.language_model.layers.39.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1337
  "model.language_model.layers.39.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1338
  "model.language_model.layers.39.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1339
+ "model.language_model.layers.39.self_attn.v_proj.weight": "model-missing-base.safetensors",
1340
  "model.language_model.layers.4.input_layernorm.weight": "model-00002-of-00004.safetensors",
1341
  "model.language_model.layers.4.layer_scalar": "model-00002-of-00004.safetensors",
1342
  "model.language_model.layers.4.mlp.down_proj.weight": "model-00002-of-00004.safetensors",
 
1365
  "model.language_model.layers.40.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1366
  "model.language_model.layers.40.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1367
  "model.language_model.layers.40.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1368
+ "model.language_model.layers.40.self_attn.k_norm.weight": "model-missing-base.safetensors",
1369
+ "model.language_model.layers.40.self_attn.k_proj.weight": "model-missing-base.safetensors",
1370
  "model.language_model.layers.40.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1371
  "model.language_model.layers.40.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1372
  "model.language_model.layers.40.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1373
+ "model.language_model.layers.40.self_attn.v_proj.weight": "model-missing-base.safetensors",
1374
  "model.language_model.layers.41.input_layernorm.weight": "model-00003-of-00004.safetensors",
1375
  "model.language_model.layers.41.layer_scalar": "model-00003-of-00004.safetensors",
1376
  "model.language_model.layers.41.mlp.down_proj.weight": "model-00003-of-00004.safetensors",
 
1382
  "model.language_model.layers.41.post_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1383
  "model.language_model.layers.41.post_per_layer_input_norm.weight": "model-00003-of-00004.safetensors",
1384
  "model.language_model.layers.41.pre_feedforward_layernorm.weight": "model-00003-of-00004.safetensors",
1385
+ "model.language_model.layers.41.self_attn.k_norm.weight": "model-missing-base.safetensors",
1386
+ "model.language_model.layers.41.self_attn.k_proj.weight": "model-missing-base.safetensors",
1387
  "model.language_model.layers.41.self_attn.o_proj.weight": "model-00003-of-00004.safetensors",
1388
  "model.language_model.layers.41.self_attn.q_norm.weight": "model-00003-of-00004.safetensors",
1389
  "model.language_model.layers.41.self_attn.q_proj.weight": "model-00003-of-00004.safetensors",
1390
+ "model.language_model.layers.41.self_attn.v_proj.weight": "model-missing-base.safetensors",
1391
  "model.language_model.layers.5.input_layernorm.weight": "model-00002-of-00004.safetensors",
1392
  "model.language_model.layers.5.layer_scalar": "model-00002-of-00004.safetensors",
1393
  "model.language_model.layers.5.mlp.down_proj.weight": "model-00002-of-00004.safetensors",