{ "metadata": { "total_parameters": 21969664, "total_size": 87878656 }, "weight_map": { "encoder.1.input_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.norm1.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.norm1.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.norm2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.norm2.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.2.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.norm1.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.norm1.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.norm2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.norm2.bias": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.1.transformer.layers.3.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.1.output_proj.weight": "model-00001-of-00001.safetensors", "encoder.3.input_proj.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.3.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.3.output_proj.weight": "model-00001-of-00001.safetensors", "encoder.5.input_proj.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.5.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.5.output_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.input_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.norm1.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.norm1.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.norm2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.norm2.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.2.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.norm1.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.norm1.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.norm2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.norm2.bias": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.ffn.0.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.ffn.2.weight": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.layer_scale_1.scale": "model-00001-of-00001.safetensors", "encoder.7.transformer.layers.3.layer_scale_2.scale": "model-00001-of-00001.safetensors", "encoder.7.output_proj.weight": "model-00001-of-00001.safetensors", "quantizer.input_proj.bias": "model-00001-of-00001.safetensors", "quantizer.input_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.input_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.output_proj.bias": "model-00001-of-00001.safetensors", "quantizer.output_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.output_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.0.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.1.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.2.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.3.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.4.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.5.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.6.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.7.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.8.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.9.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.10.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.11.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.12.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.13.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.14.codebook.weight": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.in_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.in_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.in_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.out_proj.bias": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.out_proj.parametrizations.weight.original0": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.out_proj.parametrizations.weight.original1": "model-00001-of-00001.safetensors", "quantizer.quantizers.15.codebook.weight": "model-00001-of-00001.safetensors", "decoder.1.input_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.norm1.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.norm1.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.norm2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.norm2.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.2.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.norm1.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.norm1.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.norm2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.norm2.bias": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.1.transformer.layers.3.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.1.output_proj.weight": "model-00001-of-00001.safetensors", "decoder.3.input_proj.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.3.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.3.output_proj.weight": "model-00001-of-00001.safetensors", "decoder.5.input_proj.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.5.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.5.output_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.input_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.norm1.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.norm1.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.norm2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.norm2.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.0.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.norm1.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.norm1.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.norm2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.norm2.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.1.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.norm1.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.norm1.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.norm2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.norm2.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.2.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.norm1.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.norm1.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.self_attn.in_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.self_attn.out_proj.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.norm2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.norm2.bias": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.ffn.0.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.ffn.2.weight": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.layer_scale_1.scale": "model-00001-of-00001.safetensors", "decoder.7.transformer.layers.3.layer_scale_2.scale": "model-00001-of-00001.safetensors", "decoder.7.output_proj.weight": "model-00001-of-00001.safetensors" } }