{ "metadata": { "total_size": 4716536288, "total_parameters": 4002337008 }, "weight_map": { "acoustic_transformer.acoustic_codebook_output.weight": "model.safetensors", "acoustic_transformer.input_projection.weight": "model.safetensors", "acoustic_transformer.layers.0.attention.wk.scales": "model.safetensors", "acoustic_transformer.layers.0.attention.wk.weight": "model.safetensors", "acoustic_transformer.layers.0.attention.wo.scales": "model.safetensors", "acoustic_transformer.layers.0.attention.wo.weight": "model.safetensors", "acoustic_transformer.layers.0.attention.wq.scales": "model.safetensors", "acoustic_transformer.layers.0.attention.wq.weight": "model.safetensors", "acoustic_transformer.layers.0.attention.wv.scales": "model.safetensors", "acoustic_transformer.layers.0.attention.wv.weight": "model.safetensors", "acoustic_transformer.layers.0.attention_norm.weight": "model.safetensors", "acoustic_transformer.layers.0.feed_forward_w1.scales": "model.safetensors", "acoustic_transformer.layers.0.feed_forward_w1.weight": "model.safetensors", "acoustic_transformer.layers.0.feed_forward_w2.scales": "model.safetensors", "acoustic_transformer.layers.0.feed_forward_w2.weight": "model.safetensors", "acoustic_transformer.layers.0.feed_forward_w3.scales": "model.safetensors", "acoustic_transformer.layers.0.feed_forward_w3.weight": "model.safetensors", "acoustic_transformer.layers.0.ffn_norm.weight": "model.safetensors", "acoustic_transformer.layers.1.attention.wk.scales": "model.safetensors", "acoustic_transformer.layers.1.attention.wk.weight": "model.safetensors", "acoustic_transformer.layers.1.attention.wo.scales": "model.safetensors", "acoustic_transformer.layers.1.attention.wo.weight": "model.safetensors", "acoustic_transformer.layers.1.attention.wq.scales": "model.safetensors", "acoustic_transformer.layers.1.attention.wq.weight": "model.safetensors", "acoustic_transformer.layers.1.attention.wv.scales": "model.safetensors", "acoustic_transformer.layers.1.attention.wv.weight": "model.safetensors", "acoustic_transformer.layers.1.attention_norm.weight": "model.safetensors", "acoustic_transformer.layers.1.feed_forward_w1.scales": "model.safetensors", "acoustic_transformer.layers.1.feed_forward_w1.weight": "model.safetensors", "acoustic_transformer.layers.1.feed_forward_w2.scales": "model.safetensors", "acoustic_transformer.layers.1.feed_forward_w2.weight": "model.safetensors", "acoustic_transformer.layers.1.feed_forward_w3.scales": "model.safetensors", "acoustic_transformer.layers.1.feed_forward_w3.weight": "model.safetensors", "acoustic_transformer.layers.1.ffn_norm.weight": "model.safetensors", "acoustic_transformer.layers.2.attention.wk.scales": "model.safetensors", "acoustic_transformer.layers.2.attention.wk.weight": "model.safetensors", "acoustic_transformer.layers.2.attention.wo.scales": "model.safetensors", "acoustic_transformer.layers.2.attention.wo.weight": "model.safetensors", "acoustic_transformer.layers.2.attention.wq.scales": "model.safetensors", "acoustic_transformer.layers.2.attention.wq.weight": "model.safetensors", "acoustic_transformer.layers.2.attention.wv.scales": "model.safetensors", "acoustic_transformer.layers.2.attention.wv.weight": "model.safetensors", "acoustic_transformer.layers.2.attention_norm.weight": "model.safetensors", "acoustic_transformer.layers.2.feed_forward_w1.scales": "model.safetensors", "acoustic_transformer.layers.2.feed_forward_w1.weight": "model.safetensors", "acoustic_transformer.layers.2.feed_forward_w2.scales": "model.safetensors", "acoustic_transformer.layers.2.feed_forward_w2.weight": "model.safetensors", "acoustic_transformer.layers.2.feed_forward_w3.scales": "model.safetensors", "acoustic_transformer.layers.2.feed_forward_w3.weight": "model.safetensors", "acoustic_transformer.layers.2.ffn_norm.weight": "model.safetensors", "acoustic_transformer.llm_projection.scales": "model.safetensors", "acoustic_transformer.llm_projection.weight": "model.safetensors", "acoustic_transformer.norm.weight": "model.safetensors", "acoustic_transformer.semantic_codebook_output.weight": "model.safetensors", "acoustic_transformer.time_projection.scales": "model.safetensors", "acoustic_transformer.time_projection.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.0.conv.original0": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.0.conv.original1": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.0.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.1.layers.1.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.2.conv.original0": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.2.conv.original1": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.0.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.3.layers.1.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.4.conv.original0": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.4.conv.original1": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.0.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.5.layers.1.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.6.conv.original0": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.6.conv.original1": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.0.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention.k_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention.q_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention.wk.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention.wo.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention.wq.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention.wv.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.attention_scale": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.feed_forward_w1.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.feed_forward_w2.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.feed_forward_w3.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.ffn_norm.weight": "model.safetensors", "audio_tokenizer_decoder.decoder_blocks.7.layers.1.ffn_scale": "model.safetensors", "audio_tokenizer_decoder.output_proj.conv.original0": "model.safetensors", "audio_tokenizer_decoder.output_proj.conv.original1": "model.safetensors", "audio_tokenizer_decoder.quantizer_semantic_codebook.cluster_usage": "model.safetensors", "audio_tokenizer_decoder.quantizer_semantic_codebook.embedding_sum": "model.safetensors", "llm.audio_codebook_embeddings.weight": "model.safetensors", "llm.layers.0.attention.wk.scales": "model.safetensors", "llm.layers.0.attention.wk.weight": "model.safetensors", "llm.layers.0.attention.wo.scales": "model.safetensors", "llm.layers.0.attention.wo.weight": "model.safetensors", "llm.layers.0.attention.wq.scales": "model.safetensors", "llm.layers.0.attention.wq.weight": "model.safetensors", "llm.layers.0.attention.wv.scales": "model.safetensors", "llm.layers.0.attention.wv.weight": "model.safetensors", "llm.layers.0.attention_norm.weight": "model.safetensors", "llm.layers.0.feed_forward_w1.scales": "model.safetensors", "llm.layers.0.feed_forward_w1.weight": "model.safetensors", "llm.layers.0.feed_forward_w2.scales": "model.safetensors", "llm.layers.0.feed_forward_w2.weight": "model.safetensors", "llm.layers.0.feed_forward_w3.scales": "model.safetensors", "llm.layers.0.feed_forward_w3.weight": "model.safetensors", "llm.layers.0.ffn_norm.weight": "model.safetensors", "llm.layers.1.attention.wk.scales": "model.safetensors", "llm.layers.1.attention.wk.weight": "model.safetensors", "llm.layers.1.attention.wo.scales": "model.safetensors", "llm.layers.1.attention.wo.weight": "model.safetensors", "llm.layers.1.attention.wq.scales": "model.safetensors", "llm.layers.1.attention.wq.weight": "model.safetensors", "llm.layers.1.attention.wv.scales": "model.safetensors", "llm.layers.1.attention.wv.weight": "model.safetensors", "llm.layers.1.attention_norm.weight": "model.safetensors", "llm.layers.1.feed_forward_w1.scales": "model.safetensors", "llm.layers.1.feed_forward_w1.weight": "model.safetensors", "llm.layers.1.feed_forward_w2.scales": "model.safetensors", "llm.layers.1.feed_forward_w2.weight": "model.safetensors", "llm.layers.1.feed_forward_w3.scales": "model.safetensors", "llm.layers.1.feed_forward_w3.weight": "model.safetensors", "llm.layers.1.ffn_norm.weight": "model.safetensors", "llm.layers.10.attention.wk.scales": "model.safetensors", "llm.layers.10.attention.wk.weight": "model.safetensors", "llm.layers.10.attention.wo.scales": "model.safetensors", "llm.layers.10.attention.wo.weight": "model.safetensors", "llm.layers.10.attention.wq.scales": "model.safetensors", "llm.layers.10.attention.wq.weight": "model.safetensors", "llm.layers.10.attention.wv.scales": "model.safetensors", "llm.layers.10.attention.wv.weight": "model.safetensors", "llm.layers.10.attention_norm.weight": "model.safetensors", "llm.layers.10.feed_forward_w1.scales": "model.safetensors", "llm.layers.10.feed_forward_w1.weight": "model.safetensors", "llm.layers.10.feed_forward_w2.scales": "model.safetensors", "llm.layers.10.feed_forward_w2.weight": "model.safetensors", "llm.layers.10.feed_forward_w3.scales": "model.safetensors", "llm.layers.10.feed_forward_w3.weight": "model.safetensors", "llm.layers.10.ffn_norm.weight": "model.safetensors", "llm.layers.11.attention.wk.scales": "model.safetensors", "llm.layers.11.attention.wk.weight": "model.safetensors", "llm.layers.11.attention.wo.scales": "model.safetensors", "llm.layers.11.attention.wo.weight": "model.safetensors", "llm.layers.11.attention.wq.scales": "model.safetensors", "llm.layers.11.attention.wq.weight": "model.safetensors", "llm.layers.11.attention.wv.scales": "model.safetensors", "llm.layers.11.attention.wv.weight": "model.safetensors", "llm.layers.11.attention_norm.weight": "model.safetensors", "llm.layers.11.feed_forward_w1.scales": "model.safetensors", "llm.layers.11.feed_forward_w1.weight": "model.safetensors", "llm.layers.11.feed_forward_w2.scales": "model.safetensors", "llm.layers.11.feed_forward_w2.weight": "model.safetensors", "llm.layers.11.feed_forward_w3.scales": "model.safetensors", "llm.layers.11.feed_forward_w3.weight": "model.safetensors", "llm.layers.11.ffn_norm.weight": "model.safetensors", "llm.layers.12.attention.wk.scales": "model.safetensors", "llm.layers.12.attention.wk.weight": "model.safetensors", "llm.layers.12.attention.wo.scales": "model.safetensors", "llm.layers.12.attention.wo.weight": "model.safetensors", "llm.layers.12.attention.wq.scales": "model.safetensors", "llm.layers.12.attention.wq.weight": "model.safetensors", "llm.layers.12.attention.wv.scales": "model.safetensors", "llm.layers.12.attention.wv.weight": "model.safetensors", "llm.layers.12.attention_norm.weight": "model.safetensors", "llm.layers.12.feed_forward_w1.scales": "model.safetensors", "llm.layers.12.feed_forward_w1.weight": "model.safetensors", "llm.layers.12.feed_forward_w2.scales": "model.safetensors", "llm.layers.12.feed_forward_w2.weight": "model.safetensors", "llm.layers.12.feed_forward_w3.scales": "model.safetensors", "llm.layers.12.feed_forward_w3.weight": "model.safetensors", "llm.layers.12.ffn_norm.weight": "model.safetensors", "llm.layers.13.attention.wk.scales": "model.safetensors", "llm.layers.13.attention.wk.weight": "model.safetensors", "llm.layers.13.attention.wo.scales": "model.safetensors", "llm.layers.13.attention.wo.weight": "model.safetensors", "llm.layers.13.attention.wq.scales": "model.safetensors", "llm.layers.13.attention.wq.weight": "model.safetensors", "llm.layers.13.attention.wv.scales": "model.safetensors", "llm.layers.13.attention.wv.weight": "model.safetensors", "llm.layers.13.attention_norm.weight": "model.safetensors", "llm.layers.13.feed_forward_w1.scales": "model.safetensors", "llm.layers.13.feed_forward_w1.weight": "model.safetensors", "llm.layers.13.feed_forward_w2.scales": "model.safetensors", "llm.layers.13.feed_forward_w2.weight": "model.safetensors", "llm.layers.13.feed_forward_w3.scales": "model.safetensors", "llm.layers.13.feed_forward_w3.weight": "model.safetensors", "llm.layers.13.ffn_norm.weight": "model.safetensors", "llm.layers.14.attention.wk.scales": "model.safetensors", "llm.layers.14.attention.wk.weight": "model.safetensors", "llm.layers.14.attention.wo.scales": "model.safetensors", "llm.layers.14.attention.wo.weight": "model.safetensors", "llm.layers.14.attention.wq.scales": "model.safetensors", "llm.layers.14.attention.wq.weight": "model.safetensors", "llm.layers.14.attention.wv.scales": "model.safetensors", "llm.layers.14.attention.wv.weight": "model.safetensors", "llm.layers.14.attention_norm.weight": "model.safetensors", "llm.layers.14.feed_forward_w1.scales": "model.safetensors", "llm.layers.14.feed_forward_w1.weight": "model.safetensors", "llm.layers.14.feed_forward_w2.scales": "model.safetensors", "llm.layers.14.feed_forward_w2.weight": "model.safetensors", "llm.layers.14.feed_forward_w3.scales": "model.safetensors", "llm.layers.14.feed_forward_w3.weight": "model.safetensors", "llm.layers.14.ffn_norm.weight": "model.safetensors", "llm.layers.15.attention.wk.scales": "model.safetensors", "llm.layers.15.attention.wk.weight": "model.safetensors", "llm.layers.15.attention.wo.scales": "model.safetensors", "llm.layers.15.attention.wo.weight": "model.safetensors", "llm.layers.15.attention.wq.scales": "model.safetensors", "llm.layers.15.attention.wq.weight": "model.safetensors", "llm.layers.15.attention.wv.scales": "model.safetensors", "llm.layers.15.attention.wv.weight": "model.safetensors", "llm.layers.15.attention_norm.weight": "model.safetensors", "llm.layers.15.feed_forward_w1.scales": "model.safetensors", "llm.layers.15.feed_forward_w1.weight": "model.safetensors", "llm.layers.15.feed_forward_w2.scales": "model.safetensors", "llm.layers.15.feed_forward_w2.weight": "model.safetensors", "llm.layers.15.feed_forward_w3.scales": "model.safetensors", "llm.layers.15.feed_forward_w3.weight": "model.safetensors", "llm.layers.15.ffn_norm.weight": "model.safetensors", "llm.layers.16.attention.wk.scales": "model.safetensors", "llm.layers.16.attention.wk.weight": "model.safetensors", "llm.layers.16.attention.wo.scales": "model.safetensors", "llm.layers.16.attention.wo.weight": "model.safetensors", "llm.layers.16.attention.wq.scales": "model.safetensors", "llm.layers.16.attention.wq.weight": "model.safetensors", "llm.layers.16.attention.wv.scales": "model.safetensors", "llm.layers.16.attention.wv.weight": "model.safetensors", "llm.layers.16.attention_norm.weight": "model.safetensors", "llm.layers.16.feed_forward_w1.scales": "model.safetensors", "llm.layers.16.feed_forward_w1.weight": "model.safetensors", "llm.layers.16.feed_forward_w2.scales": "model.safetensors", "llm.layers.16.feed_forward_w2.weight": "model.safetensors", "llm.layers.16.feed_forward_w3.scales": "model.safetensors", "llm.layers.16.feed_forward_w3.weight": "model.safetensors", "llm.layers.16.ffn_norm.weight": "model.safetensors", "llm.layers.17.attention.wk.scales": "model.safetensors", "llm.layers.17.attention.wk.weight": "model.safetensors", "llm.layers.17.attention.wo.scales": "model.safetensors", "llm.layers.17.attention.wo.weight": "model.safetensors", "llm.layers.17.attention.wq.scales": "model.safetensors", "llm.layers.17.attention.wq.weight": "model.safetensors", "llm.layers.17.attention.wv.scales": "model.safetensors", "llm.layers.17.attention.wv.weight": "model.safetensors", "llm.layers.17.attention_norm.weight": "model.safetensors", "llm.layers.17.feed_forward_w1.scales": "model.safetensors", "llm.layers.17.feed_forward_w1.weight": "model.safetensors", "llm.layers.17.feed_forward_w2.scales": "model.safetensors", "llm.layers.17.feed_forward_w2.weight": "model.safetensors", "llm.layers.17.feed_forward_w3.scales": "model.safetensors", "llm.layers.17.feed_forward_w3.weight": "model.safetensors", "llm.layers.17.ffn_norm.weight": "model.safetensors", "llm.layers.18.attention.wk.scales": "model.safetensors", "llm.layers.18.attention.wk.weight": "model.safetensors", "llm.layers.18.attention.wo.scales": "model.safetensors", "llm.layers.18.attention.wo.weight": "model.safetensors", "llm.layers.18.attention.wq.scales": "model.safetensors", "llm.layers.18.attention.wq.weight": "model.safetensors", "llm.layers.18.attention.wv.scales": "model.safetensors", "llm.layers.18.attention.wv.weight": "model.safetensors", "llm.layers.18.attention_norm.weight": "model.safetensors", "llm.layers.18.feed_forward_w1.scales": "model.safetensors", "llm.layers.18.feed_forward_w1.weight": "model.safetensors", "llm.layers.18.feed_forward_w2.scales": "model.safetensors", "llm.layers.18.feed_forward_w2.weight": "model.safetensors", "llm.layers.18.feed_forward_w3.scales": "model.safetensors", "llm.layers.18.feed_forward_w3.weight": "model.safetensors", "llm.layers.18.ffn_norm.weight": "model.safetensors", "llm.layers.19.attention.wk.scales": "model.safetensors", "llm.layers.19.attention.wk.weight": "model.safetensors", "llm.layers.19.attention.wo.scales": "model.safetensors", "llm.layers.19.attention.wo.weight": "model.safetensors", "llm.layers.19.attention.wq.scales": "model.safetensors", "llm.layers.19.attention.wq.weight": "model.safetensors", "llm.layers.19.attention.wv.scales": "model.safetensors", "llm.layers.19.attention.wv.weight": "model.safetensors", "llm.layers.19.attention_norm.weight": "model.safetensors", "llm.layers.19.feed_forward_w1.scales": "model.safetensors", "llm.layers.19.feed_forward_w1.weight": "model.safetensors", "llm.layers.19.feed_forward_w2.scales": "model.safetensors", "llm.layers.19.feed_forward_w2.weight": "model.safetensors", "llm.layers.19.feed_forward_w3.scales": "model.safetensors", "llm.layers.19.feed_forward_w3.weight": "model.safetensors", "llm.layers.19.ffn_norm.weight": "model.safetensors", "llm.layers.2.attention.wk.scales": "model.safetensors", "llm.layers.2.attention.wk.weight": "model.safetensors", "llm.layers.2.attention.wo.scales": "model.safetensors", "llm.layers.2.attention.wo.weight": "model.safetensors", "llm.layers.2.attention.wq.scales": "model.safetensors", "llm.layers.2.attention.wq.weight": "model.safetensors", "llm.layers.2.attention.wv.scales": "model.safetensors", "llm.layers.2.attention.wv.weight": "model.safetensors", "llm.layers.2.attention_norm.weight": "model.safetensors", "llm.layers.2.feed_forward_w1.scales": "model.safetensors", "llm.layers.2.feed_forward_w1.weight": "model.safetensors", "llm.layers.2.feed_forward_w2.scales": "model.safetensors", "llm.layers.2.feed_forward_w2.weight": "model.safetensors", "llm.layers.2.feed_forward_w3.scales": "model.safetensors", "llm.layers.2.feed_forward_w3.weight": "model.safetensors", "llm.layers.2.ffn_norm.weight": "model.safetensors", "llm.layers.20.attention.wk.scales": "model.safetensors", "llm.layers.20.attention.wk.weight": "model.safetensors", "llm.layers.20.attention.wo.scales": "model.safetensors", "llm.layers.20.attention.wo.weight": "model.safetensors", "llm.layers.20.attention.wq.scales": "model.safetensors", "llm.layers.20.attention.wq.weight": "model.safetensors", "llm.layers.20.attention.wv.scales": "model.safetensors", "llm.layers.20.attention.wv.weight": "model.safetensors", "llm.layers.20.attention_norm.weight": "model.safetensors", "llm.layers.20.feed_forward_w1.scales": "model.safetensors", "llm.layers.20.feed_forward_w1.weight": "model.safetensors", "llm.layers.20.feed_forward_w2.scales": "model.safetensors", "llm.layers.20.feed_forward_w2.weight": "model.safetensors", "llm.layers.20.feed_forward_w3.scales": "model.safetensors", "llm.layers.20.feed_forward_w3.weight": "model.safetensors", "llm.layers.20.ffn_norm.weight": "model.safetensors", "llm.layers.21.attention.wk.scales": "model.safetensors", "llm.layers.21.attention.wk.weight": "model.safetensors", "llm.layers.21.attention.wo.scales": "model.safetensors", "llm.layers.21.attention.wo.weight": "model.safetensors", "llm.layers.21.attention.wq.scales": "model.safetensors", "llm.layers.21.attention.wq.weight": "model.safetensors", "llm.layers.21.attention.wv.scales": "model.safetensors", "llm.layers.21.attention.wv.weight": "model.safetensors", "llm.layers.21.attention_norm.weight": "model.safetensors", "llm.layers.21.feed_forward_w1.scales": "model.safetensors", "llm.layers.21.feed_forward_w1.weight": "model.safetensors", "llm.layers.21.feed_forward_w2.scales": "model.safetensors", "llm.layers.21.feed_forward_w2.weight": "model.safetensors", "llm.layers.21.feed_forward_w3.scales": "model.safetensors", "llm.layers.21.feed_forward_w3.weight": "model.safetensors", "llm.layers.21.ffn_norm.weight": "model.safetensors", "llm.layers.22.attention.wk.scales": "model.safetensors", "llm.layers.22.attention.wk.weight": "model.safetensors", "llm.layers.22.attention.wo.scales": "model.safetensors", "llm.layers.22.attention.wo.weight": "model.safetensors", "llm.layers.22.attention.wq.scales": "model.safetensors", "llm.layers.22.attention.wq.weight": "model.safetensors", "llm.layers.22.attention.wv.scales": "model.safetensors", "llm.layers.22.attention.wv.weight": "model.safetensors", "llm.layers.22.attention_norm.weight": "model.safetensors", "llm.layers.22.feed_forward_w1.scales": "model.safetensors", "llm.layers.22.feed_forward_w1.weight": "model.safetensors", "llm.layers.22.feed_forward_w2.scales": "model.safetensors", "llm.layers.22.feed_forward_w2.weight": "model.safetensors", "llm.layers.22.feed_forward_w3.scales": "model.safetensors", "llm.layers.22.feed_forward_w3.weight": "model.safetensors", "llm.layers.22.ffn_norm.weight": "model.safetensors", "llm.layers.23.attention.wk.scales": "model.safetensors", "llm.layers.23.attention.wk.weight": "model.safetensors", "llm.layers.23.attention.wo.scales": "model.safetensors", "llm.layers.23.attention.wo.weight": "model.safetensors", "llm.layers.23.attention.wq.scales": "model.safetensors", "llm.layers.23.attention.wq.weight": "model.safetensors", "llm.layers.23.attention.wv.scales": "model.safetensors", "llm.layers.23.attention.wv.weight": "model.safetensors", "llm.layers.23.attention_norm.weight": "model.safetensors", "llm.layers.23.feed_forward_w1.scales": "model.safetensors", "llm.layers.23.feed_forward_w1.weight": "model.safetensors", "llm.layers.23.feed_forward_w2.scales": "model.safetensors", "llm.layers.23.feed_forward_w2.weight": "model.safetensors", "llm.layers.23.feed_forward_w3.scales": "model.safetensors", "llm.layers.23.feed_forward_w3.weight": "model.safetensors", "llm.layers.23.ffn_norm.weight": "model.safetensors", "llm.layers.24.attention.wk.scales": "model.safetensors", "llm.layers.24.attention.wk.weight": "model.safetensors", "llm.layers.24.attention.wo.scales": "model.safetensors", "llm.layers.24.attention.wo.weight": "model.safetensors", "llm.layers.24.attention.wq.scales": "model.safetensors", "llm.layers.24.attention.wq.weight": "model.safetensors", "llm.layers.24.attention.wv.scales": "model.safetensors", "llm.layers.24.attention.wv.weight": "model.safetensors", "llm.layers.24.attention_norm.weight": "model.safetensors", "llm.layers.24.feed_forward_w1.scales": "model.safetensors", "llm.layers.24.feed_forward_w1.weight": "model.safetensors", "llm.layers.24.feed_forward_w2.scales": "model.safetensors", "llm.layers.24.feed_forward_w2.weight": "model.safetensors", "llm.layers.24.feed_forward_w3.scales": "model.safetensors", "llm.layers.24.feed_forward_w3.weight": "model.safetensors", "llm.layers.24.ffn_norm.weight": "model.safetensors", "llm.layers.25.attention.wk.scales": "model.safetensors", "llm.layers.25.attention.wk.weight": "model.safetensors", "llm.layers.25.attention.wo.scales": "model.safetensors", "llm.layers.25.attention.wo.weight": "model.safetensors", "llm.layers.25.attention.wq.scales": "model.safetensors", "llm.layers.25.attention.wq.weight": "model.safetensors", "llm.layers.25.attention.wv.scales": "model.safetensors", "llm.layers.25.attention.wv.weight": "model.safetensors", "llm.layers.25.attention_norm.weight": "model.safetensors", "llm.layers.25.feed_forward_w1.scales": "model.safetensors", "llm.layers.25.feed_forward_w1.weight": "model.safetensors", "llm.layers.25.feed_forward_w2.scales": "model.safetensors", "llm.layers.25.feed_forward_w2.weight": "model.safetensors", "llm.layers.25.feed_forward_w3.scales": "model.safetensors", "llm.layers.25.feed_forward_w3.weight": "model.safetensors", "llm.layers.25.ffn_norm.weight": "model.safetensors", "llm.layers.3.attention.wk.scales": "model.safetensors", "llm.layers.3.attention.wk.weight": "model.safetensors", "llm.layers.3.attention.wo.scales": "model.safetensors", "llm.layers.3.attention.wo.weight": "model.safetensors", "llm.layers.3.attention.wq.scales": "model.safetensors", "llm.layers.3.attention.wq.weight": "model.safetensors", "llm.layers.3.attention.wv.scales": "model.safetensors", "llm.layers.3.attention.wv.weight": "model.safetensors", "llm.layers.3.attention_norm.weight": "model.safetensors", "llm.layers.3.feed_forward_w1.scales": "model.safetensors", "llm.layers.3.feed_forward_w1.weight": "model.safetensors", "llm.layers.3.feed_forward_w2.scales": "model.safetensors", "llm.layers.3.feed_forward_w2.weight": "model.safetensors", "llm.layers.3.feed_forward_w3.scales": "model.safetensors", "llm.layers.3.feed_forward_w3.weight": "model.safetensors", "llm.layers.3.ffn_norm.weight": "model.safetensors", "llm.layers.4.attention.wk.scales": "model.safetensors", "llm.layers.4.attention.wk.weight": "model.safetensors", "llm.layers.4.attention.wo.scales": "model.safetensors", "llm.layers.4.attention.wo.weight": "model.safetensors", "llm.layers.4.attention.wq.scales": "model.safetensors", "llm.layers.4.attention.wq.weight": "model.safetensors", "llm.layers.4.attention.wv.scales": "model.safetensors", "llm.layers.4.attention.wv.weight": "model.safetensors", "llm.layers.4.attention_norm.weight": "model.safetensors", "llm.layers.4.feed_forward_w1.scales": "model.safetensors", "llm.layers.4.feed_forward_w1.weight": "model.safetensors", "llm.layers.4.feed_forward_w2.scales": "model.safetensors", "llm.layers.4.feed_forward_w2.weight": "model.safetensors", "llm.layers.4.feed_forward_w3.scales": "model.safetensors", "llm.layers.4.feed_forward_w3.weight": "model.safetensors", "llm.layers.4.ffn_norm.weight": "model.safetensors", "llm.layers.5.attention.wk.scales": "model.safetensors", "llm.layers.5.attention.wk.weight": "model.safetensors", "llm.layers.5.attention.wo.scales": "model.safetensors", "llm.layers.5.attention.wo.weight": "model.safetensors", "llm.layers.5.attention.wq.scales": "model.safetensors", "llm.layers.5.attention.wq.weight": "model.safetensors", "llm.layers.5.attention.wv.scales": "model.safetensors", "llm.layers.5.attention.wv.weight": "model.safetensors", "llm.layers.5.attention_norm.weight": "model.safetensors", "llm.layers.5.feed_forward_w1.scales": "model.safetensors", "llm.layers.5.feed_forward_w1.weight": "model.safetensors", "llm.layers.5.feed_forward_w2.scales": "model.safetensors", "llm.layers.5.feed_forward_w2.weight": "model.safetensors", "llm.layers.5.feed_forward_w3.scales": "model.safetensors", "llm.layers.5.feed_forward_w3.weight": "model.safetensors", "llm.layers.5.ffn_norm.weight": "model.safetensors", "llm.layers.6.attention.wk.scales": "model.safetensors", "llm.layers.6.attention.wk.weight": "model.safetensors", "llm.layers.6.attention.wo.scales": "model.safetensors", "llm.layers.6.attention.wo.weight": "model.safetensors", "llm.layers.6.attention.wq.scales": "model.safetensors", "llm.layers.6.attention.wq.weight": "model.safetensors", "llm.layers.6.attention.wv.scales": "model.safetensors", "llm.layers.6.attention.wv.weight": "model.safetensors", "llm.layers.6.attention_norm.weight": "model.safetensors", "llm.layers.6.feed_forward_w1.scales": "model.safetensors", "llm.layers.6.feed_forward_w1.weight": "model.safetensors", "llm.layers.6.feed_forward_w2.scales": "model.safetensors", "llm.layers.6.feed_forward_w2.weight": "model.safetensors", "llm.layers.6.feed_forward_w3.scales": "model.safetensors", "llm.layers.6.feed_forward_w3.weight": "model.safetensors", "llm.layers.6.ffn_norm.weight": "model.safetensors", "llm.layers.7.attention.wk.scales": "model.safetensors", "llm.layers.7.attention.wk.weight": "model.safetensors", "llm.layers.7.attention.wo.scales": "model.safetensors", "llm.layers.7.attention.wo.weight": "model.safetensors", "llm.layers.7.attention.wq.scales": "model.safetensors", "llm.layers.7.attention.wq.weight": "model.safetensors", "llm.layers.7.attention.wv.scales": "model.safetensors", "llm.layers.7.attention.wv.weight": "model.safetensors", "llm.layers.7.attention_norm.weight": "model.safetensors", "llm.layers.7.feed_forward_w1.scales": "model.safetensors", "llm.layers.7.feed_forward_w1.weight": "model.safetensors", "llm.layers.7.feed_forward_w2.scales": "model.safetensors", "llm.layers.7.feed_forward_w2.weight": "model.safetensors", "llm.layers.7.feed_forward_w3.scales": "model.safetensors", "llm.layers.7.feed_forward_w3.weight": "model.safetensors", "llm.layers.7.ffn_norm.weight": "model.safetensors", "llm.layers.8.attention.wk.scales": "model.safetensors", "llm.layers.8.attention.wk.weight": "model.safetensors", "llm.layers.8.attention.wo.scales": "model.safetensors", "llm.layers.8.attention.wo.weight": "model.safetensors", "llm.layers.8.attention.wq.scales": "model.safetensors", "llm.layers.8.attention.wq.weight": "model.safetensors", "llm.layers.8.attention.wv.scales": "model.safetensors", "llm.layers.8.attention.wv.weight": "model.safetensors", "llm.layers.8.attention_norm.weight": "model.safetensors", "llm.layers.8.feed_forward_w1.scales": "model.safetensors", "llm.layers.8.feed_forward_w1.weight": "model.safetensors", "llm.layers.8.feed_forward_w2.scales": "model.safetensors", "llm.layers.8.feed_forward_w2.weight": "model.safetensors", "llm.layers.8.feed_forward_w3.scales": "model.safetensors", "llm.layers.8.feed_forward_w3.weight": "model.safetensors", "llm.layers.8.ffn_norm.weight": "model.safetensors", "llm.layers.9.attention.wk.scales": "model.safetensors", "llm.layers.9.attention.wk.weight": "model.safetensors", "llm.layers.9.attention.wo.scales": "model.safetensors", "llm.layers.9.attention.wo.weight": "model.safetensors", "llm.layers.9.attention.wq.scales": "model.safetensors", "llm.layers.9.attention.wq.weight": "model.safetensors", "llm.layers.9.attention.wv.scales": "model.safetensors", "llm.layers.9.attention.wv.weight": "model.safetensors", "llm.layers.9.attention_norm.weight": "model.safetensors", "llm.layers.9.feed_forward_w1.scales": "model.safetensors", "llm.layers.9.feed_forward_w1.weight": "model.safetensors", "llm.layers.9.feed_forward_w2.scales": "model.safetensors", "llm.layers.9.feed_forward_w2.weight": "model.safetensors", "llm.layers.9.feed_forward_w3.scales": "model.safetensors", "llm.layers.9.feed_forward_w3.weight": "model.safetensors", "llm.layers.9.ffn_norm.weight": "model.safetensors", "llm.norm.weight": "model.safetensors", "llm.tok_embeddings.weight": "model.safetensors" } }