{ "base": { "dir": "~/AI/local_models_exl/glm-4.6-exl3-4bpw", "bpw": 4.015793627432631 }, "alts": [ { "dir": "~/AI/local_models_exl/glm-4.6-exl3-5bpw", "bpw": 5.015586054132434 }, { "dir": "~/AI/local_models_exl/glm-4.6-exl3-6bpw", "bpw": 6.015378480832238 } ], "groups": [ { "idx": 0, "layers": [ "model.layers.0.self_attn.q_proj" ], "candidates": [ { "dkld": -2.5164801627397537e-05, "dbits": 62914560 }, { "dkld": 1.8384424038231373e-05, "dbits": 125829120 } ] }, { "idx": 1, "layers": [ "model.layers.0.self_attn.k_proj", "model.layers.0.self_attn.v_proj" ], "candidates": [ { "dkld": 1.4285696670413364e-05, "dbits": 10485760 }, { "dkld": -3.289827145636082e-05, "dbits": 20971520 } ] }, { "idx": 2, "layers": [ "model.layers.0.self_attn.o_proj" ], "candidates": [ { "dkld": 4.898635670542821e-05, "dbits": 62914560 }, { "dkld": 7.211375050246785e-05, "dbits": 125829120 } ] }, { "idx": 3, "layers": [ "model.layers.0.mlp.gate_proj", "model.layers.0.mlp.up_proj" ], "candidates": [ { "dkld": -9.173848666250636e-05, "dbits": 125829120 }, { "dkld": -2.436479553580284e-05, "dbits": 251658240 } ] }, { "idx": 4, "layers": [ "model.layers.0.mlp.down_proj" ], "candidates": [ { "dkld": -7.209992036223342e-05, "dbits": 62914560 }, { "dkld": -2.96549173071977e-05, "dbits": 125829120 } ] }, { "idx": 5, "layers": [ "model.layers.1.self_attn.q_proj" ], "candidates": [ { "dkld": -4.123151302336953e-06, "dbits": 62914560 }, { "dkld": -2.0676269195973526e-05, "dbits": 125829120 } ] }, { "idx": 6, "layers": [ "model.layers.1.self_attn.k_proj", "model.layers.1.self_attn.v_proj" ], "candidates": [ { "dkld": 9.082257747650146e-06, "dbits": 10485760 }, { "dkld": 6.920890882611275e-06, "dbits": 20971520 } ] }, { "idx": 7, "layers": [ "model.layers.1.self_attn.o_proj" ], "candidates": [ { "dkld": -2.3826677352189324e-05, "dbits": 62914560 }, { "dkld": -1.555224880576099e-05, "dbits": 125829120 } ] }, { "idx": 8, "layers": [ "model.layers.1.mlp.gate_proj", "model.layers.1.mlp.up_proj" ], "candidates": [ { "dkld": -5.465871654450859e-05, "dbits": 125829120 }, { "dkld": -0.00013767215423285926, "dbits": 251658240 } ] }, { "idx": 9, "layers": [ "model.layers.1.mlp.down_proj" ], "candidates": [ { "dkld": -4.150066524743687e-06, "dbits": 62914560 }, { "dkld": 2.5907158851624923e-05, "dbits": 125829120 } ] }, { "idx": 10, "layers": [ "model.layers.2.self_attn.q_proj" ], "candidates": [ { "dkld": -8.564442396160471e-07, "dbits": 62914560 }, { "dkld": -1.0017445310948891e-05, "dbits": 125829120 } ] }, { "idx": 11, "layers": [ "model.layers.2.self_attn.k_proj", "model.layers.2.self_attn.v_proj" ], "candidates": [ { "dkld": 6.850529462100116e-06, "dbits": 10485760 }, { "dkld": 0.00016430700197815964, "dbits": 20971520 } ] }, { "idx": 12, "layers": [ "model.layers.2.self_attn.o_proj" ], "candidates": [ { "dkld": -5.1201251335441025e-05, "dbits": 62914560 }, { "dkld": -7.7507272362708e-05, "dbits": 125829120 } ] }, { "idx": 13, "layers": [ "model.layers.2.mlp.gate_proj", "model.layers.2.mlp.up_proj" ], "candidates": [ { "dkld": -0.0001994210528209802, "dbits": 125829120 }, { "dkld": -0.0001642897492274628, "dbits": 251658240 } ] }, { "idx": 14, "layers": [ "model.layers.2.mlp.down_proj" ], "candidates": [ { "dkld": -1.1399644427000089e-05, "dbits": 62914560 }, { "dkld": 7.352964021265646e-05, "dbits": 125829120 } ] }, { "idx": 15, "layers": [ "model.layers.3.self_attn.q_proj" ], "candidates": [ { "dkld": -1.1829403229057442e-05, "dbits": 62914560 }, { "dkld": -1.874228473752737e-05, "dbits": 125829120 } ] }, { "idx": 16, "layers": [ "model.layers.3.self_attn.k_proj", "model.layers.3.self_attn.v_proj" ], "candidates": [ { "dkld": -3.541889600455067e-06, "dbits": 10485760 }, { "dkld": -1.5000905841588627e-05, "dbits": 20971520 } ] }, { "idx": 17, "layers": [ "model.layers.3.self_attn.o_proj" ], "candidates": [ { "dkld": -1.3161147944628152e-05, "dbits": 62914560 }, { "dkld": 2.135129179805552e-05, "dbits": 125829120 } ] }, { "idx": 18, "layers": [ "model.layers.3.mlp.shared_experts.gate_proj", "model.layers.3.mlp.shared_experts.up_proj", "model.layers.3.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -7.306593470275333e-05, "dbits": 23592960 }, { "dkld": -4.933353047817911e-05, "dbits": 47185920 } ] }, { "idx": 19, "layers": [ "model.layers.3.mlp.experts.0.gate_proj", "model.layers.3.mlp.experts.1.gate_proj", "model.layers.3.mlp.experts.2.gate_proj", "model.layers.3.mlp.experts.3.gate_proj", "model.layers.3.mlp.experts.4.gate_proj", "model.layers.3.mlp.experts.5.gate_proj", "model.layers.3.mlp.experts.6.gate_proj", "model.layers.3.mlp.experts.7.gate_proj", "model.layers.3.mlp.experts.8.gate_proj", "model.layers.3.mlp.experts.9.gate_proj", "model.layers.3.mlp.experts.10.gate_proj", "model.layers.3.mlp.experts.11.gate_proj", "model.layers.3.mlp.experts.12.gate_proj", "model.layers.3.mlp.experts.13.gate_proj", "model.layers.3.mlp.experts.14.gate_proj", "model.layers.3.mlp.experts.15.gate_proj", "model.layers.3.mlp.experts.16.gate_proj", "model.layers.3.mlp.experts.17.gate_proj", "model.layers.3.mlp.experts.18.gate_proj", "model.layers.3.mlp.experts.19.gate_proj", "model.layers.3.mlp.experts.20.gate_proj", "model.layers.3.mlp.experts.21.gate_proj", "model.layers.3.mlp.experts.22.gate_proj", "model.layers.3.mlp.experts.23.gate_proj", "model.layers.3.mlp.experts.24.gate_proj", "model.layers.3.mlp.experts.25.gate_proj", "model.layers.3.mlp.experts.26.gate_proj", "model.layers.3.mlp.experts.27.gate_proj", "model.layers.3.mlp.experts.28.gate_proj", "model.layers.3.mlp.experts.29.gate_proj", "model.layers.3.mlp.experts.30.gate_proj", "model.layers.3.mlp.experts.31.gate_proj", "model.layers.3.mlp.experts.32.gate_proj", "model.layers.3.mlp.experts.33.gate_proj", "model.layers.3.mlp.experts.34.gate_proj", "model.layers.3.mlp.experts.35.gate_proj", "model.layers.3.mlp.experts.36.gate_proj", "model.layers.3.mlp.experts.37.gate_proj", "model.layers.3.mlp.experts.38.gate_proj", "model.layers.3.mlp.experts.39.gate_proj", "model.layers.3.mlp.experts.40.gate_proj", "model.layers.3.mlp.experts.41.gate_proj", "model.layers.3.mlp.experts.42.gate_proj", "model.layers.3.mlp.experts.43.gate_proj", "model.layers.3.mlp.experts.44.gate_proj", "model.layers.3.mlp.experts.45.gate_proj", "model.layers.3.mlp.experts.46.gate_proj", "model.layers.3.mlp.experts.47.gate_proj", "model.layers.3.mlp.experts.48.gate_proj", "model.layers.3.mlp.experts.49.gate_proj", "model.layers.3.mlp.experts.50.gate_proj", "model.layers.3.mlp.experts.51.gate_proj", "model.layers.3.mlp.experts.52.gate_proj", "model.layers.3.mlp.experts.53.gate_proj", "model.layers.3.mlp.experts.54.gate_proj", "model.layers.3.mlp.experts.55.gate_proj", "model.layers.3.mlp.experts.56.gate_proj", "model.layers.3.mlp.experts.57.gate_proj", "model.layers.3.mlp.experts.58.gate_proj", "model.layers.3.mlp.experts.59.gate_proj", "model.layers.3.mlp.experts.60.gate_proj", "model.layers.3.mlp.experts.61.gate_proj", "model.layers.3.mlp.experts.62.gate_proj", "model.layers.3.mlp.experts.63.gate_proj", "model.layers.3.mlp.experts.64.gate_proj", "model.layers.3.mlp.experts.65.gate_proj", "model.layers.3.mlp.experts.66.gate_proj", "model.layers.3.mlp.experts.67.gate_proj", "model.layers.3.mlp.experts.68.gate_proj", "model.layers.3.mlp.experts.69.gate_proj", "model.layers.3.mlp.experts.70.gate_proj", "model.layers.3.mlp.experts.71.gate_proj", "model.layers.3.mlp.experts.72.gate_proj", "model.layers.3.mlp.experts.73.gate_proj", "model.layers.3.mlp.experts.74.gate_proj", "model.layers.3.mlp.experts.75.gate_proj", "model.layers.3.mlp.experts.76.gate_proj", "model.layers.3.mlp.experts.77.gate_proj", "model.layers.3.mlp.experts.78.gate_proj", "model.layers.3.mlp.experts.79.gate_proj", "model.layers.3.mlp.experts.80.gate_proj", "model.layers.3.mlp.experts.81.gate_proj", "model.layers.3.mlp.experts.82.gate_proj", "model.layers.3.mlp.experts.83.gate_proj", "model.layers.3.mlp.experts.84.gate_proj", "model.layers.3.mlp.experts.85.gate_proj", "model.layers.3.mlp.experts.86.gate_proj", "model.layers.3.mlp.experts.87.gate_proj", "model.layers.3.mlp.experts.88.gate_proj", "model.layers.3.mlp.experts.89.gate_proj", "model.layers.3.mlp.experts.90.gate_proj", "model.layers.3.mlp.experts.91.gate_proj", "model.layers.3.mlp.experts.92.gate_proj", "model.layers.3.mlp.experts.93.gate_proj", "model.layers.3.mlp.experts.94.gate_proj", "model.layers.3.mlp.experts.95.gate_proj", "model.layers.3.mlp.experts.96.gate_proj", "model.layers.3.mlp.experts.97.gate_proj", "model.layers.3.mlp.experts.98.gate_proj", "model.layers.3.mlp.experts.99.gate_proj", "model.layers.3.mlp.experts.100.gate_proj", "model.layers.3.mlp.experts.101.gate_proj", "model.layers.3.mlp.experts.102.gate_proj", "model.layers.3.mlp.experts.103.gate_proj", "model.layers.3.mlp.experts.104.gate_proj", "model.layers.3.mlp.experts.105.gate_proj", "model.layers.3.mlp.experts.106.gate_proj", "model.layers.3.mlp.experts.107.gate_proj", "model.layers.3.mlp.experts.108.gate_proj", "model.layers.3.mlp.experts.109.gate_proj", "model.layers.3.mlp.experts.110.gate_proj", "model.layers.3.mlp.experts.111.gate_proj", "model.layers.3.mlp.experts.112.gate_proj", "model.layers.3.mlp.experts.113.gate_proj", "model.layers.3.mlp.experts.114.gate_proj", "model.layers.3.mlp.experts.115.gate_proj", "model.layers.3.mlp.experts.116.gate_proj", "model.layers.3.mlp.experts.117.gate_proj", "model.layers.3.mlp.experts.118.gate_proj", "model.layers.3.mlp.experts.119.gate_proj", "model.layers.3.mlp.experts.120.gate_proj", "model.layers.3.mlp.experts.121.gate_proj", "model.layers.3.mlp.experts.122.gate_proj", "model.layers.3.mlp.experts.123.gate_proj", "model.layers.3.mlp.experts.124.gate_proj", "model.layers.3.mlp.experts.125.gate_proj", "model.layers.3.mlp.experts.126.gate_proj", "model.layers.3.mlp.experts.127.gate_proj", "model.layers.3.mlp.experts.128.gate_proj", "model.layers.3.mlp.experts.129.gate_proj", "model.layers.3.mlp.experts.130.gate_proj", "model.layers.3.mlp.experts.131.gate_proj", "model.layers.3.mlp.experts.132.gate_proj", "model.layers.3.mlp.experts.133.gate_proj", "model.layers.3.mlp.experts.134.gate_proj", "model.layers.3.mlp.experts.135.gate_proj", "model.layers.3.mlp.experts.136.gate_proj", "model.layers.3.mlp.experts.137.gate_proj", "model.layers.3.mlp.experts.138.gate_proj", "model.layers.3.mlp.experts.139.gate_proj", "model.layers.3.mlp.experts.140.gate_proj", "model.layers.3.mlp.experts.141.gate_proj", "model.layers.3.mlp.experts.142.gate_proj", "model.layers.3.mlp.experts.143.gate_proj", "model.layers.3.mlp.experts.144.gate_proj", "model.layers.3.mlp.experts.145.gate_proj", "model.layers.3.mlp.experts.146.gate_proj", "model.layers.3.mlp.experts.147.gate_proj", "model.layers.3.mlp.experts.148.gate_proj", "model.layers.3.mlp.experts.149.gate_proj", "model.layers.3.mlp.experts.150.gate_proj", "model.layers.3.mlp.experts.151.gate_proj", "model.layers.3.mlp.experts.152.gate_proj", "model.layers.3.mlp.experts.153.gate_proj", "model.layers.3.mlp.experts.154.gate_proj", "model.layers.3.mlp.experts.155.gate_proj", "model.layers.3.mlp.experts.156.gate_proj", "model.layers.3.mlp.experts.157.gate_proj", "model.layers.3.mlp.experts.158.gate_proj", "model.layers.3.mlp.experts.159.gate_proj", "model.layers.3.mlp.experts.0.up_proj", "model.layers.3.mlp.experts.1.up_proj", "model.layers.3.mlp.experts.2.up_proj", "model.layers.3.mlp.experts.3.up_proj", "model.layers.3.mlp.experts.4.up_proj", "model.layers.3.mlp.experts.5.up_proj", "model.layers.3.mlp.experts.6.up_proj", "model.layers.3.mlp.experts.7.up_proj", "model.layers.3.mlp.experts.8.up_proj", "model.layers.3.mlp.experts.9.up_proj", "model.layers.3.mlp.experts.10.up_proj", "model.layers.3.mlp.experts.11.up_proj", "model.layers.3.mlp.experts.12.up_proj", "model.layers.3.mlp.experts.13.up_proj", "model.layers.3.mlp.experts.14.up_proj", "model.layers.3.mlp.experts.15.up_proj", "model.layers.3.mlp.experts.16.up_proj", "model.layers.3.mlp.experts.17.up_proj", "model.layers.3.mlp.experts.18.up_proj", "model.layers.3.mlp.experts.19.up_proj", "model.layers.3.mlp.experts.20.up_proj", "model.layers.3.mlp.experts.21.up_proj", "model.layers.3.mlp.experts.22.up_proj", "model.layers.3.mlp.experts.23.up_proj", "model.layers.3.mlp.experts.24.up_proj", "model.layers.3.mlp.experts.25.up_proj", "model.layers.3.mlp.experts.26.up_proj", "model.layers.3.mlp.experts.27.up_proj", "model.layers.3.mlp.experts.28.up_proj", "model.layers.3.mlp.experts.29.up_proj", "model.layers.3.mlp.experts.30.up_proj", "model.layers.3.mlp.experts.31.up_proj", "model.layers.3.mlp.experts.32.up_proj", "model.layers.3.mlp.experts.33.up_proj", "model.layers.3.mlp.experts.34.up_proj", "model.layers.3.mlp.experts.35.up_proj", "model.layers.3.mlp.experts.36.up_proj", "model.layers.3.mlp.experts.37.up_proj", "model.layers.3.mlp.experts.38.up_proj", "model.layers.3.mlp.experts.39.up_proj", "model.layers.3.mlp.experts.40.up_proj", "model.layers.3.mlp.experts.41.up_proj", "model.layers.3.mlp.experts.42.up_proj", "model.layers.3.mlp.experts.43.up_proj", "model.layers.3.mlp.experts.44.up_proj", "model.layers.3.mlp.experts.45.up_proj", "model.layers.3.mlp.experts.46.up_proj", "model.layers.3.mlp.experts.47.up_proj", "model.layers.3.mlp.experts.48.up_proj", "model.layers.3.mlp.experts.49.up_proj", "model.layers.3.mlp.experts.50.up_proj", "model.layers.3.mlp.experts.51.up_proj", "model.layers.3.mlp.experts.52.up_proj", "model.layers.3.mlp.experts.53.up_proj", "model.layers.3.mlp.experts.54.up_proj", "model.layers.3.mlp.experts.55.up_proj", "model.layers.3.mlp.experts.56.up_proj", "model.layers.3.mlp.experts.57.up_proj", "model.layers.3.mlp.experts.58.up_proj", "model.layers.3.mlp.experts.59.up_proj", "model.layers.3.mlp.experts.60.up_proj", "model.layers.3.mlp.experts.61.up_proj", "model.layers.3.mlp.experts.62.up_proj", "model.layers.3.mlp.experts.63.up_proj", "model.layers.3.mlp.experts.64.up_proj", "model.layers.3.mlp.experts.65.up_proj", "model.layers.3.mlp.experts.66.up_proj", "model.layers.3.mlp.experts.67.up_proj", "model.layers.3.mlp.experts.68.up_proj", "model.layers.3.mlp.experts.69.up_proj", "model.layers.3.mlp.experts.70.up_proj", "model.layers.3.mlp.experts.71.up_proj", "model.layers.3.mlp.experts.72.up_proj", "model.layers.3.mlp.experts.73.up_proj", "model.layers.3.mlp.experts.74.up_proj", "model.layers.3.mlp.experts.75.up_proj", "model.layers.3.mlp.experts.76.up_proj", "model.layers.3.mlp.experts.77.up_proj", "model.layers.3.mlp.experts.78.up_proj", "model.layers.3.mlp.experts.79.up_proj", "model.layers.3.mlp.experts.80.up_proj", "model.layers.3.mlp.experts.81.up_proj", "model.layers.3.mlp.experts.82.up_proj", "model.layers.3.mlp.experts.83.up_proj", "model.layers.3.mlp.experts.84.up_proj", "model.layers.3.mlp.experts.85.up_proj", "model.layers.3.mlp.experts.86.up_proj", "model.layers.3.mlp.experts.87.up_proj", "model.layers.3.mlp.experts.88.up_proj", "model.layers.3.mlp.experts.89.up_proj", "model.layers.3.mlp.experts.90.up_proj", "model.layers.3.mlp.experts.91.up_proj", "model.layers.3.mlp.experts.92.up_proj", "model.layers.3.mlp.experts.93.up_proj", "model.layers.3.mlp.experts.94.up_proj", "model.layers.3.mlp.experts.95.up_proj", "model.layers.3.mlp.experts.96.up_proj", "model.layers.3.mlp.experts.97.up_proj", "model.layers.3.mlp.experts.98.up_proj", "model.layers.3.mlp.experts.99.up_proj", "model.layers.3.mlp.experts.100.up_proj", "model.layers.3.mlp.experts.101.up_proj", "model.layers.3.mlp.experts.102.up_proj", "model.layers.3.mlp.experts.103.up_proj", "model.layers.3.mlp.experts.104.up_proj", "model.layers.3.mlp.experts.105.up_proj", "model.layers.3.mlp.experts.106.up_proj", "model.layers.3.mlp.experts.107.up_proj", "model.layers.3.mlp.experts.108.up_proj", "model.layers.3.mlp.experts.109.up_proj", "model.layers.3.mlp.experts.110.up_proj", "model.layers.3.mlp.experts.111.up_proj", "model.layers.3.mlp.experts.112.up_proj", "model.layers.3.mlp.experts.113.up_proj", "model.layers.3.mlp.experts.114.up_proj", "model.layers.3.mlp.experts.115.up_proj", "model.layers.3.mlp.experts.116.up_proj", "model.layers.3.mlp.experts.117.up_proj", "model.layers.3.mlp.experts.118.up_proj", "model.layers.3.mlp.experts.119.up_proj", "model.layers.3.mlp.experts.120.up_proj", "model.layers.3.mlp.experts.121.up_proj", "model.layers.3.mlp.experts.122.up_proj", "model.layers.3.mlp.experts.123.up_proj", "model.layers.3.mlp.experts.124.up_proj", "model.layers.3.mlp.experts.125.up_proj", "model.layers.3.mlp.experts.126.up_proj", "model.layers.3.mlp.experts.127.up_proj", "model.layers.3.mlp.experts.128.up_proj", "model.layers.3.mlp.experts.129.up_proj", "model.layers.3.mlp.experts.130.up_proj", "model.layers.3.mlp.experts.131.up_proj", "model.layers.3.mlp.experts.132.up_proj", "model.layers.3.mlp.experts.133.up_proj", "model.layers.3.mlp.experts.134.up_proj", "model.layers.3.mlp.experts.135.up_proj", "model.layers.3.mlp.experts.136.up_proj", "model.layers.3.mlp.experts.137.up_proj", "model.layers.3.mlp.experts.138.up_proj", "model.layers.3.mlp.experts.139.up_proj", "model.layers.3.mlp.experts.140.up_proj", "model.layers.3.mlp.experts.141.up_proj", "model.layers.3.mlp.experts.142.up_proj", "model.layers.3.mlp.experts.143.up_proj", "model.layers.3.mlp.experts.144.up_proj", "model.layers.3.mlp.experts.145.up_proj", "model.layers.3.mlp.experts.146.up_proj", "model.layers.3.mlp.experts.147.up_proj", "model.layers.3.mlp.experts.148.up_proj", "model.layers.3.mlp.experts.149.up_proj", "model.layers.3.mlp.experts.150.up_proj", "model.layers.3.mlp.experts.151.up_proj", "model.layers.3.mlp.experts.152.up_proj", "model.layers.3.mlp.experts.153.up_proj", "model.layers.3.mlp.experts.154.up_proj", "model.layers.3.mlp.experts.155.up_proj", "model.layers.3.mlp.experts.156.up_proj", "model.layers.3.mlp.experts.157.up_proj", "model.layers.3.mlp.experts.158.up_proj", "model.layers.3.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.5156506560741814e-05, "dbits": 2516582400 }, { "dkld": -2.2729206830262097e-05, "dbits": 5033164800 } ] }, { "idx": 20, "layers": [ "model.layers.3.mlp.experts.0.down_proj", "model.layers.3.mlp.experts.1.down_proj", "model.layers.3.mlp.experts.2.down_proj", "model.layers.3.mlp.experts.3.down_proj", "model.layers.3.mlp.experts.4.down_proj", "model.layers.3.mlp.experts.5.down_proj", "model.layers.3.mlp.experts.6.down_proj", "model.layers.3.mlp.experts.7.down_proj", "model.layers.3.mlp.experts.8.down_proj", "model.layers.3.mlp.experts.9.down_proj", "model.layers.3.mlp.experts.10.down_proj", "model.layers.3.mlp.experts.11.down_proj", "model.layers.3.mlp.experts.12.down_proj", "model.layers.3.mlp.experts.13.down_proj", "model.layers.3.mlp.experts.14.down_proj", "model.layers.3.mlp.experts.15.down_proj", "model.layers.3.mlp.experts.16.down_proj", "model.layers.3.mlp.experts.17.down_proj", "model.layers.3.mlp.experts.18.down_proj", "model.layers.3.mlp.experts.19.down_proj", "model.layers.3.mlp.experts.20.down_proj", "model.layers.3.mlp.experts.21.down_proj", "model.layers.3.mlp.experts.22.down_proj", "model.layers.3.mlp.experts.23.down_proj", "model.layers.3.mlp.experts.24.down_proj", "model.layers.3.mlp.experts.25.down_proj", "model.layers.3.mlp.experts.26.down_proj", "model.layers.3.mlp.experts.27.down_proj", "model.layers.3.mlp.experts.28.down_proj", "model.layers.3.mlp.experts.29.down_proj", "model.layers.3.mlp.experts.30.down_proj", "model.layers.3.mlp.experts.31.down_proj", "model.layers.3.mlp.experts.32.down_proj", "model.layers.3.mlp.experts.33.down_proj", "model.layers.3.mlp.experts.34.down_proj", "model.layers.3.mlp.experts.35.down_proj", "model.layers.3.mlp.experts.36.down_proj", "model.layers.3.mlp.experts.37.down_proj", "model.layers.3.mlp.experts.38.down_proj", "model.layers.3.mlp.experts.39.down_proj", "model.layers.3.mlp.experts.40.down_proj", "model.layers.3.mlp.experts.41.down_proj", "model.layers.3.mlp.experts.42.down_proj", "model.layers.3.mlp.experts.43.down_proj", "model.layers.3.mlp.experts.44.down_proj", "model.layers.3.mlp.experts.45.down_proj", "model.layers.3.mlp.experts.46.down_proj", "model.layers.3.mlp.experts.47.down_proj", "model.layers.3.mlp.experts.48.down_proj", "model.layers.3.mlp.experts.49.down_proj", "model.layers.3.mlp.experts.50.down_proj", "model.layers.3.mlp.experts.51.down_proj", "model.layers.3.mlp.experts.52.down_proj", "model.layers.3.mlp.experts.53.down_proj", "model.layers.3.mlp.experts.54.down_proj", "model.layers.3.mlp.experts.55.down_proj", "model.layers.3.mlp.experts.56.down_proj", "model.layers.3.mlp.experts.57.down_proj", "model.layers.3.mlp.experts.58.down_proj", "model.layers.3.mlp.experts.59.down_proj", "model.layers.3.mlp.experts.60.down_proj", "model.layers.3.mlp.experts.61.down_proj", "model.layers.3.mlp.experts.62.down_proj", "model.layers.3.mlp.experts.63.down_proj", "model.layers.3.mlp.experts.64.down_proj", "model.layers.3.mlp.experts.65.down_proj", "model.layers.3.mlp.experts.66.down_proj", "model.layers.3.mlp.experts.67.down_proj", "model.layers.3.mlp.experts.68.down_proj", "model.layers.3.mlp.experts.69.down_proj", "model.layers.3.mlp.experts.70.down_proj", "model.layers.3.mlp.experts.71.down_proj", "model.layers.3.mlp.experts.72.down_proj", "model.layers.3.mlp.experts.73.down_proj", "model.layers.3.mlp.experts.74.down_proj", "model.layers.3.mlp.experts.75.down_proj", "model.layers.3.mlp.experts.76.down_proj", "model.layers.3.mlp.experts.77.down_proj", "model.layers.3.mlp.experts.78.down_proj", "model.layers.3.mlp.experts.79.down_proj", "model.layers.3.mlp.experts.80.down_proj", "model.layers.3.mlp.experts.81.down_proj", "model.layers.3.mlp.experts.82.down_proj", "model.layers.3.mlp.experts.83.down_proj", "model.layers.3.mlp.experts.84.down_proj", "model.layers.3.mlp.experts.85.down_proj", "model.layers.3.mlp.experts.86.down_proj", "model.layers.3.mlp.experts.87.down_proj", "model.layers.3.mlp.experts.88.down_proj", "model.layers.3.mlp.experts.89.down_proj", "model.layers.3.mlp.experts.90.down_proj", "model.layers.3.mlp.experts.91.down_proj", "model.layers.3.mlp.experts.92.down_proj", "model.layers.3.mlp.experts.93.down_proj", "model.layers.3.mlp.experts.94.down_proj", "model.layers.3.mlp.experts.95.down_proj", "model.layers.3.mlp.experts.96.down_proj", "model.layers.3.mlp.experts.97.down_proj", "model.layers.3.mlp.experts.98.down_proj", "model.layers.3.mlp.experts.99.down_proj", "model.layers.3.mlp.experts.100.down_proj", "model.layers.3.mlp.experts.101.down_proj", "model.layers.3.mlp.experts.102.down_proj", "model.layers.3.mlp.experts.103.down_proj", "model.layers.3.mlp.experts.104.down_proj", "model.layers.3.mlp.experts.105.down_proj", "model.layers.3.mlp.experts.106.down_proj", "model.layers.3.mlp.experts.107.down_proj", "model.layers.3.mlp.experts.108.down_proj", "model.layers.3.mlp.experts.109.down_proj", "model.layers.3.mlp.experts.110.down_proj", "model.layers.3.mlp.experts.111.down_proj", "model.layers.3.mlp.experts.112.down_proj", "model.layers.3.mlp.experts.113.down_proj", "model.layers.3.mlp.experts.114.down_proj", "model.layers.3.mlp.experts.115.down_proj", "model.layers.3.mlp.experts.116.down_proj", "model.layers.3.mlp.experts.117.down_proj", "model.layers.3.mlp.experts.118.down_proj", "model.layers.3.mlp.experts.119.down_proj", "model.layers.3.mlp.experts.120.down_proj", "model.layers.3.mlp.experts.121.down_proj", "model.layers.3.mlp.experts.122.down_proj", "model.layers.3.mlp.experts.123.down_proj", "model.layers.3.mlp.experts.124.down_proj", "model.layers.3.mlp.experts.125.down_proj", "model.layers.3.mlp.experts.126.down_proj", "model.layers.3.mlp.experts.127.down_proj", "model.layers.3.mlp.experts.128.down_proj", "model.layers.3.mlp.experts.129.down_proj", "model.layers.3.mlp.experts.130.down_proj", "model.layers.3.mlp.experts.131.down_proj", "model.layers.3.mlp.experts.132.down_proj", "model.layers.3.mlp.experts.133.down_proj", "model.layers.3.mlp.experts.134.down_proj", "model.layers.3.mlp.experts.135.down_proj", "model.layers.3.mlp.experts.136.down_proj", "model.layers.3.mlp.experts.137.down_proj", "model.layers.3.mlp.experts.138.down_proj", "model.layers.3.mlp.experts.139.down_proj", "model.layers.3.mlp.experts.140.down_proj", "model.layers.3.mlp.experts.141.down_proj", "model.layers.3.mlp.experts.142.down_proj", "model.layers.3.mlp.experts.143.down_proj", "model.layers.3.mlp.experts.144.down_proj", "model.layers.3.mlp.experts.145.down_proj", "model.layers.3.mlp.experts.146.down_proj", "model.layers.3.mlp.experts.147.down_proj", "model.layers.3.mlp.experts.148.down_proj", "model.layers.3.mlp.experts.149.down_proj", "model.layers.3.mlp.experts.150.down_proj", "model.layers.3.mlp.experts.151.down_proj", "model.layers.3.mlp.experts.152.down_proj", "model.layers.3.mlp.experts.153.down_proj", "model.layers.3.mlp.experts.154.down_proj", "model.layers.3.mlp.experts.155.down_proj", "model.layers.3.mlp.experts.156.down_proj", "model.layers.3.mlp.experts.157.down_proj", "model.layers.3.mlp.experts.158.down_proj", "model.layers.3.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.830342415720155e-05, "dbits": 1258291200 }, { "dkld": -2.1534762345253033e-05, "dbits": 2516582400 } ] }, { "idx": 21, "layers": [ "model.layers.4.self_attn.q_proj" ], "candidates": [ { "dkld": -4.662515129894018e-05, "dbits": 62914560 }, { "dkld": -1.1541647836552094e-06, "dbits": 125829120 } ] }, { "idx": 22, "layers": [ "model.layers.4.self_attn.k_proj", "model.layers.4.self_attn.v_proj" ], "candidates": [ { "dkld": -0.000126368319615721, "dbits": 10485760 }, { "dkld": -0.00010706661269068579, "dbits": 20971520 } ] }, { "idx": 23, "layers": [ "model.layers.4.self_attn.o_proj" ], "candidates": [ { "dkld": -1.2440374121069908e-05, "dbits": 62914560 }, { "dkld": -1.1059106327593327e-05, "dbits": 125829120 } ] }, { "idx": 24, "layers": [ "model.layers.4.mlp.shared_experts.gate_proj", "model.layers.4.mlp.shared_experts.up_proj", "model.layers.4.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.37291106209145e-05, "dbits": 23592960 }, { "dkld": -5.621900781989028e-05, "dbits": 47185920 } ] }, { "idx": 25, "layers": [ "model.layers.4.mlp.experts.0.gate_proj", "model.layers.4.mlp.experts.1.gate_proj", "model.layers.4.mlp.experts.2.gate_proj", "model.layers.4.mlp.experts.3.gate_proj", "model.layers.4.mlp.experts.4.gate_proj", "model.layers.4.mlp.experts.5.gate_proj", "model.layers.4.mlp.experts.6.gate_proj", "model.layers.4.mlp.experts.7.gate_proj", "model.layers.4.mlp.experts.8.gate_proj", "model.layers.4.mlp.experts.9.gate_proj", "model.layers.4.mlp.experts.10.gate_proj", "model.layers.4.mlp.experts.11.gate_proj", "model.layers.4.mlp.experts.12.gate_proj", "model.layers.4.mlp.experts.13.gate_proj", "model.layers.4.mlp.experts.14.gate_proj", "model.layers.4.mlp.experts.15.gate_proj", "model.layers.4.mlp.experts.16.gate_proj", "model.layers.4.mlp.experts.17.gate_proj", "model.layers.4.mlp.experts.18.gate_proj", "model.layers.4.mlp.experts.19.gate_proj", "model.layers.4.mlp.experts.20.gate_proj", "model.layers.4.mlp.experts.21.gate_proj", "model.layers.4.mlp.experts.22.gate_proj", "model.layers.4.mlp.experts.23.gate_proj", "model.layers.4.mlp.experts.24.gate_proj", "model.layers.4.mlp.experts.25.gate_proj", "model.layers.4.mlp.experts.26.gate_proj", "model.layers.4.mlp.experts.27.gate_proj", "model.layers.4.mlp.experts.28.gate_proj", "model.layers.4.mlp.experts.29.gate_proj", "model.layers.4.mlp.experts.30.gate_proj", "model.layers.4.mlp.experts.31.gate_proj", "model.layers.4.mlp.experts.32.gate_proj", "model.layers.4.mlp.experts.33.gate_proj", "model.layers.4.mlp.experts.34.gate_proj", "model.layers.4.mlp.experts.35.gate_proj", "model.layers.4.mlp.experts.36.gate_proj", "model.layers.4.mlp.experts.37.gate_proj", "model.layers.4.mlp.experts.38.gate_proj", "model.layers.4.mlp.experts.39.gate_proj", "model.layers.4.mlp.experts.40.gate_proj", "model.layers.4.mlp.experts.41.gate_proj", "model.layers.4.mlp.experts.42.gate_proj", "model.layers.4.mlp.experts.43.gate_proj", "model.layers.4.mlp.experts.44.gate_proj", "model.layers.4.mlp.experts.45.gate_proj", "model.layers.4.mlp.experts.46.gate_proj", "model.layers.4.mlp.experts.47.gate_proj", "model.layers.4.mlp.experts.48.gate_proj", "model.layers.4.mlp.experts.49.gate_proj", "model.layers.4.mlp.experts.50.gate_proj", "model.layers.4.mlp.experts.51.gate_proj", "model.layers.4.mlp.experts.52.gate_proj", "model.layers.4.mlp.experts.53.gate_proj", "model.layers.4.mlp.experts.54.gate_proj", "model.layers.4.mlp.experts.55.gate_proj", "model.layers.4.mlp.experts.56.gate_proj", "model.layers.4.mlp.experts.57.gate_proj", "model.layers.4.mlp.experts.58.gate_proj", "model.layers.4.mlp.experts.59.gate_proj", "model.layers.4.mlp.experts.60.gate_proj", "model.layers.4.mlp.experts.61.gate_proj", "model.layers.4.mlp.experts.62.gate_proj", "model.layers.4.mlp.experts.63.gate_proj", "model.layers.4.mlp.experts.64.gate_proj", "model.layers.4.mlp.experts.65.gate_proj", "model.layers.4.mlp.experts.66.gate_proj", "model.layers.4.mlp.experts.67.gate_proj", "model.layers.4.mlp.experts.68.gate_proj", "model.layers.4.mlp.experts.69.gate_proj", "model.layers.4.mlp.experts.70.gate_proj", "model.layers.4.mlp.experts.71.gate_proj", "model.layers.4.mlp.experts.72.gate_proj", "model.layers.4.mlp.experts.73.gate_proj", "model.layers.4.mlp.experts.74.gate_proj", "model.layers.4.mlp.experts.75.gate_proj", "model.layers.4.mlp.experts.76.gate_proj", "model.layers.4.mlp.experts.77.gate_proj", "model.layers.4.mlp.experts.78.gate_proj", "model.layers.4.mlp.experts.79.gate_proj", "model.layers.4.mlp.experts.80.gate_proj", "model.layers.4.mlp.experts.81.gate_proj", "model.layers.4.mlp.experts.82.gate_proj", "model.layers.4.mlp.experts.83.gate_proj", "model.layers.4.mlp.experts.84.gate_proj", "model.layers.4.mlp.experts.85.gate_proj", "model.layers.4.mlp.experts.86.gate_proj", "model.layers.4.mlp.experts.87.gate_proj", "model.layers.4.mlp.experts.88.gate_proj", "model.layers.4.mlp.experts.89.gate_proj", "model.layers.4.mlp.experts.90.gate_proj", "model.layers.4.mlp.experts.91.gate_proj", "model.layers.4.mlp.experts.92.gate_proj", "model.layers.4.mlp.experts.93.gate_proj", "model.layers.4.mlp.experts.94.gate_proj", "model.layers.4.mlp.experts.95.gate_proj", "model.layers.4.mlp.experts.96.gate_proj", "model.layers.4.mlp.experts.97.gate_proj", "model.layers.4.mlp.experts.98.gate_proj", "model.layers.4.mlp.experts.99.gate_proj", "model.layers.4.mlp.experts.100.gate_proj", "model.layers.4.mlp.experts.101.gate_proj", "model.layers.4.mlp.experts.102.gate_proj", "model.layers.4.mlp.experts.103.gate_proj", "model.layers.4.mlp.experts.104.gate_proj", "model.layers.4.mlp.experts.105.gate_proj", "model.layers.4.mlp.experts.106.gate_proj", "model.layers.4.mlp.experts.107.gate_proj", "model.layers.4.mlp.experts.108.gate_proj", "model.layers.4.mlp.experts.109.gate_proj", "model.layers.4.mlp.experts.110.gate_proj", "model.layers.4.mlp.experts.111.gate_proj", "model.layers.4.mlp.experts.112.gate_proj", "model.layers.4.mlp.experts.113.gate_proj", "model.layers.4.mlp.experts.114.gate_proj", "model.layers.4.mlp.experts.115.gate_proj", "model.layers.4.mlp.experts.116.gate_proj", "model.layers.4.mlp.experts.117.gate_proj", "model.layers.4.mlp.experts.118.gate_proj", "model.layers.4.mlp.experts.119.gate_proj", "model.layers.4.mlp.experts.120.gate_proj", "model.layers.4.mlp.experts.121.gate_proj", "model.layers.4.mlp.experts.122.gate_proj", "model.layers.4.mlp.experts.123.gate_proj", "model.layers.4.mlp.experts.124.gate_proj", "model.layers.4.mlp.experts.125.gate_proj", "model.layers.4.mlp.experts.126.gate_proj", "model.layers.4.mlp.experts.127.gate_proj", "model.layers.4.mlp.experts.128.gate_proj", "model.layers.4.mlp.experts.129.gate_proj", "model.layers.4.mlp.experts.130.gate_proj", "model.layers.4.mlp.experts.131.gate_proj", "model.layers.4.mlp.experts.132.gate_proj", "model.layers.4.mlp.experts.133.gate_proj", "model.layers.4.mlp.experts.134.gate_proj", "model.layers.4.mlp.experts.135.gate_proj", "model.layers.4.mlp.experts.136.gate_proj", "model.layers.4.mlp.experts.137.gate_proj", "model.layers.4.mlp.experts.138.gate_proj", "model.layers.4.mlp.experts.139.gate_proj", "model.layers.4.mlp.experts.140.gate_proj", "model.layers.4.mlp.experts.141.gate_proj", "model.layers.4.mlp.experts.142.gate_proj", "model.layers.4.mlp.experts.143.gate_proj", "model.layers.4.mlp.experts.144.gate_proj", "model.layers.4.mlp.experts.145.gate_proj", "model.layers.4.mlp.experts.146.gate_proj", "model.layers.4.mlp.experts.147.gate_proj", "model.layers.4.mlp.experts.148.gate_proj", "model.layers.4.mlp.experts.149.gate_proj", "model.layers.4.mlp.experts.150.gate_proj", "model.layers.4.mlp.experts.151.gate_proj", "model.layers.4.mlp.experts.152.gate_proj", "model.layers.4.mlp.experts.153.gate_proj", "model.layers.4.mlp.experts.154.gate_proj", "model.layers.4.mlp.experts.155.gate_proj", "model.layers.4.mlp.experts.156.gate_proj", "model.layers.4.mlp.experts.157.gate_proj", "model.layers.4.mlp.experts.158.gate_proj", "model.layers.4.mlp.experts.159.gate_proj", "model.layers.4.mlp.experts.0.up_proj", "model.layers.4.mlp.experts.1.up_proj", "model.layers.4.mlp.experts.2.up_proj", "model.layers.4.mlp.experts.3.up_proj", "model.layers.4.mlp.experts.4.up_proj", "model.layers.4.mlp.experts.5.up_proj", "model.layers.4.mlp.experts.6.up_proj", "model.layers.4.mlp.experts.7.up_proj", "model.layers.4.mlp.experts.8.up_proj", "model.layers.4.mlp.experts.9.up_proj", "model.layers.4.mlp.experts.10.up_proj", "model.layers.4.mlp.experts.11.up_proj", "model.layers.4.mlp.experts.12.up_proj", "model.layers.4.mlp.experts.13.up_proj", "model.layers.4.mlp.experts.14.up_proj", "model.layers.4.mlp.experts.15.up_proj", "model.layers.4.mlp.experts.16.up_proj", "model.layers.4.mlp.experts.17.up_proj", "model.layers.4.mlp.experts.18.up_proj", "model.layers.4.mlp.experts.19.up_proj", "model.layers.4.mlp.experts.20.up_proj", "model.layers.4.mlp.experts.21.up_proj", "model.layers.4.mlp.experts.22.up_proj", "model.layers.4.mlp.experts.23.up_proj", "model.layers.4.mlp.experts.24.up_proj", "model.layers.4.mlp.experts.25.up_proj", "model.layers.4.mlp.experts.26.up_proj", "model.layers.4.mlp.experts.27.up_proj", "model.layers.4.mlp.experts.28.up_proj", "model.layers.4.mlp.experts.29.up_proj", "model.layers.4.mlp.experts.30.up_proj", "model.layers.4.mlp.experts.31.up_proj", "model.layers.4.mlp.experts.32.up_proj", "model.layers.4.mlp.experts.33.up_proj", "model.layers.4.mlp.experts.34.up_proj", "model.layers.4.mlp.experts.35.up_proj", "model.layers.4.mlp.experts.36.up_proj", "model.layers.4.mlp.experts.37.up_proj", "model.layers.4.mlp.experts.38.up_proj", "model.layers.4.mlp.experts.39.up_proj", "model.layers.4.mlp.experts.40.up_proj", "model.layers.4.mlp.experts.41.up_proj", "model.layers.4.mlp.experts.42.up_proj", "model.layers.4.mlp.experts.43.up_proj", "model.layers.4.mlp.experts.44.up_proj", "model.layers.4.mlp.experts.45.up_proj", "model.layers.4.mlp.experts.46.up_proj", "model.layers.4.mlp.experts.47.up_proj", "model.layers.4.mlp.experts.48.up_proj", "model.layers.4.mlp.experts.49.up_proj", "model.layers.4.mlp.experts.50.up_proj", "model.layers.4.mlp.experts.51.up_proj", "model.layers.4.mlp.experts.52.up_proj", "model.layers.4.mlp.experts.53.up_proj", "model.layers.4.mlp.experts.54.up_proj", "model.layers.4.mlp.experts.55.up_proj", "model.layers.4.mlp.experts.56.up_proj", "model.layers.4.mlp.experts.57.up_proj", "model.layers.4.mlp.experts.58.up_proj", "model.layers.4.mlp.experts.59.up_proj", "model.layers.4.mlp.experts.60.up_proj", "model.layers.4.mlp.experts.61.up_proj", "model.layers.4.mlp.experts.62.up_proj", "model.layers.4.mlp.experts.63.up_proj", "model.layers.4.mlp.experts.64.up_proj", "model.layers.4.mlp.experts.65.up_proj", "model.layers.4.mlp.experts.66.up_proj", "model.layers.4.mlp.experts.67.up_proj", "model.layers.4.mlp.experts.68.up_proj", "model.layers.4.mlp.experts.69.up_proj", "model.layers.4.mlp.experts.70.up_proj", "model.layers.4.mlp.experts.71.up_proj", "model.layers.4.mlp.experts.72.up_proj", "model.layers.4.mlp.experts.73.up_proj", "model.layers.4.mlp.experts.74.up_proj", "model.layers.4.mlp.experts.75.up_proj", "model.layers.4.mlp.experts.76.up_proj", "model.layers.4.mlp.experts.77.up_proj", "model.layers.4.mlp.experts.78.up_proj", "model.layers.4.mlp.experts.79.up_proj", "model.layers.4.mlp.experts.80.up_proj", "model.layers.4.mlp.experts.81.up_proj", "model.layers.4.mlp.experts.82.up_proj", "model.layers.4.mlp.experts.83.up_proj", "model.layers.4.mlp.experts.84.up_proj", "model.layers.4.mlp.experts.85.up_proj", "model.layers.4.mlp.experts.86.up_proj", "model.layers.4.mlp.experts.87.up_proj", "model.layers.4.mlp.experts.88.up_proj", "model.layers.4.mlp.experts.89.up_proj", "model.layers.4.mlp.experts.90.up_proj", "model.layers.4.mlp.experts.91.up_proj", "model.layers.4.mlp.experts.92.up_proj", "model.layers.4.mlp.experts.93.up_proj", "model.layers.4.mlp.experts.94.up_proj", "model.layers.4.mlp.experts.95.up_proj", "model.layers.4.mlp.experts.96.up_proj", "model.layers.4.mlp.experts.97.up_proj", "model.layers.4.mlp.experts.98.up_proj", "model.layers.4.mlp.experts.99.up_proj", "model.layers.4.mlp.experts.100.up_proj", "model.layers.4.mlp.experts.101.up_proj", "model.layers.4.mlp.experts.102.up_proj", "model.layers.4.mlp.experts.103.up_proj", "model.layers.4.mlp.experts.104.up_proj", "model.layers.4.mlp.experts.105.up_proj", "model.layers.4.mlp.experts.106.up_proj", "model.layers.4.mlp.experts.107.up_proj", "model.layers.4.mlp.experts.108.up_proj", "model.layers.4.mlp.experts.109.up_proj", "model.layers.4.mlp.experts.110.up_proj", "model.layers.4.mlp.experts.111.up_proj", "model.layers.4.mlp.experts.112.up_proj", "model.layers.4.mlp.experts.113.up_proj", "model.layers.4.mlp.experts.114.up_proj", "model.layers.4.mlp.experts.115.up_proj", "model.layers.4.mlp.experts.116.up_proj", "model.layers.4.mlp.experts.117.up_proj", "model.layers.4.mlp.experts.118.up_proj", "model.layers.4.mlp.experts.119.up_proj", "model.layers.4.mlp.experts.120.up_proj", "model.layers.4.mlp.experts.121.up_proj", "model.layers.4.mlp.experts.122.up_proj", "model.layers.4.mlp.experts.123.up_proj", "model.layers.4.mlp.experts.124.up_proj", "model.layers.4.mlp.experts.125.up_proj", "model.layers.4.mlp.experts.126.up_proj", "model.layers.4.mlp.experts.127.up_proj", "model.layers.4.mlp.experts.128.up_proj", "model.layers.4.mlp.experts.129.up_proj", "model.layers.4.mlp.experts.130.up_proj", "model.layers.4.mlp.experts.131.up_proj", "model.layers.4.mlp.experts.132.up_proj", "model.layers.4.mlp.experts.133.up_proj", "model.layers.4.mlp.experts.134.up_proj", "model.layers.4.mlp.experts.135.up_proj", "model.layers.4.mlp.experts.136.up_proj", "model.layers.4.mlp.experts.137.up_proj", "model.layers.4.mlp.experts.138.up_proj", "model.layers.4.mlp.experts.139.up_proj", "model.layers.4.mlp.experts.140.up_proj", "model.layers.4.mlp.experts.141.up_proj", "model.layers.4.mlp.experts.142.up_proj", "model.layers.4.mlp.experts.143.up_proj", "model.layers.4.mlp.experts.144.up_proj", "model.layers.4.mlp.experts.145.up_proj", "model.layers.4.mlp.experts.146.up_proj", "model.layers.4.mlp.experts.147.up_proj", "model.layers.4.mlp.experts.148.up_proj", "model.layers.4.mlp.experts.149.up_proj", "model.layers.4.mlp.experts.150.up_proj", "model.layers.4.mlp.experts.151.up_proj", "model.layers.4.mlp.experts.152.up_proj", "model.layers.4.mlp.experts.153.up_proj", "model.layers.4.mlp.experts.154.up_proj", "model.layers.4.mlp.experts.155.up_proj", "model.layers.4.mlp.experts.156.up_proj", "model.layers.4.mlp.experts.157.up_proj", "model.layers.4.mlp.experts.158.up_proj", "model.layers.4.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.8217852599917455e-05, "dbits": 2516582400 }, { "dkld": -8.144928142428398e-05, "dbits": 5033164800 } ] }, { "idx": 26, "layers": [ "model.layers.4.mlp.experts.0.down_proj", "model.layers.4.mlp.experts.1.down_proj", "model.layers.4.mlp.experts.2.down_proj", "model.layers.4.mlp.experts.3.down_proj", "model.layers.4.mlp.experts.4.down_proj", "model.layers.4.mlp.experts.5.down_proj", "model.layers.4.mlp.experts.6.down_proj", "model.layers.4.mlp.experts.7.down_proj", "model.layers.4.mlp.experts.8.down_proj", "model.layers.4.mlp.experts.9.down_proj", "model.layers.4.mlp.experts.10.down_proj", "model.layers.4.mlp.experts.11.down_proj", "model.layers.4.mlp.experts.12.down_proj", "model.layers.4.mlp.experts.13.down_proj", "model.layers.4.mlp.experts.14.down_proj", "model.layers.4.mlp.experts.15.down_proj", "model.layers.4.mlp.experts.16.down_proj", "model.layers.4.mlp.experts.17.down_proj", "model.layers.4.mlp.experts.18.down_proj", "model.layers.4.mlp.experts.19.down_proj", "model.layers.4.mlp.experts.20.down_proj", "model.layers.4.mlp.experts.21.down_proj", "model.layers.4.mlp.experts.22.down_proj", "model.layers.4.mlp.experts.23.down_proj", "model.layers.4.mlp.experts.24.down_proj", "model.layers.4.mlp.experts.25.down_proj", "model.layers.4.mlp.experts.26.down_proj", "model.layers.4.mlp.experts.27.down_proj", "model.layers.4.mlp.experts.28.down_proj", "model.layers.4.mlp.experts.29.down_proj", "model.layers.4.mlp.experts.30.down_proj", "model.layers.4.mlp.experts.31.down_proj", "model.layers.4.mlp.experts.32.down_proj", "model.layers.4.mlp.experts.33.down_proj", "model.layers.4.mlp.experts.34.down_proj", "model.layers.4.mlp.experts.35.down_proj", "model.layers.4.mlp.experts.36.down_proj", "model.layers.4.mlp.experts.37.down_proj", "model.layers.4.mlp.experts.38.down_proj", "model.layers.4.mlp.experts.39.down_proj", "model.layers.4.mlp.experts.40.down_proj", "model.layers.4.mlp.experts.41.down_proj", "model.layers.4.mlp.experts.42.down_proj", "model.layers.4.mlp.experts.43.down_proj", "model.layers.4.mlp.experts.44.down_proj", "model.layers.4.mlp.experts.45.down_proj", "model.layers.4.mlp.experts.46.down_proj", "model.layers.4.mlp.experts.47.down_proj", "model.layers.4.mlp.experts.48.down_proj", "model.layers.4.mlp.experts.49.down_proj", "model.layers.4.mlp.experts.50.down_proj", "model.layers.4.mlp.experts.51.down_proj", "model.layers.4.mlp.experts.52.down_proj", "model.layers.4.mlp.experts.53.down_proj", "model.layers.4.mlp.experts.54.down_proj", "model.layers.4.mlp.experts.55.down_proj", "model.layers.4.mlp.experts.56.down_proj", "model.layers.4.mlp.experts.57.down_proj", "model.layers.4.mlp.experts.58.down_proj", "model.layers.4.mlp.experts.59.down_proj", "model.layers.4.mlp.experts.60.down_proj", "model.layers.4.mlp.experts.61.down_proj", "model.layers.4.mlp.experts.62.down_proj", "model.layers.4.mlp.experts.63.down_proj", "model.layers.4.mlp.experts.64.down_proj", "model.layers.4.mlp.experts.65.down_proj", "model.layers.4.mlp.experts.66.down_proj", "model.layers.4.mlp.experts.67.down_proj", "model.layers.4.mlp.experts.68.down_proj", "model.layers.4.mlp.experts.69.down_proj", "model.layers.4.mlp.experts.70.down_proj", "model.layers.4.mlp.experts.71.down_proj", "model.layers.4.mlp.experts.72.down_proj", "model.layers.4.mlp.experts.73.down_proj", "model.layers.4.mlp.experts.74.down_proj", "model.layers.4.mlp.experts.75.down_proj", "model.layers.4.mlp.experts.76.down_proj", "model.layers.4.mlp.experts.77.down_proj", "model.layers.4.mlp.experts.78.down_proj", "model.layers.4.mlp.experts.79.down_proj", "model.layers.4.mlp.experts.80.down_proj", "model.layers.4.mlp.experts.81.down_proj", "model.layers.4.mlp.experts.82.down_proj", "model.layers.4.mlp.experts.83.down_proj", "model.layers.4.mlp.experts.84.down_proj", "model.layers.4.mlp.experts.85.down_proj", "model.layers.4.mlp.experts.86.down_proj", "model.layers.4.mlp.experts.87.down_proj", "model.layers.4.mlp.experts.88.down_proj", "model.layers.4.mlp.experts.89.down_proj", "model.layers.4.mlp.experts.90.down_proj", "model.layers.4.mlp.experts.91.down_proj", "model.layers.4.mlp.experts.92.down_proj", "model.layers.4.mlp.experts.93.down_proj", "model.layers.4.mlp.experts.94.down_proj", "model.layers.4.mlp.experts.95.down_proj", "model.layers.4.mlp.experts.96.down_proj", "model.layers.4.mlp.experts.97.down_proj", "model.layers.4.mlp.experts.98.down_proj", "model.layers.4.mlp.experts.99.down_proj", "model.layers.4.mlp.experts.100.down_proj", "model.layers.4.mlp.experts.101.down_proj", "model.layers.4.mlp.experts.102.down_proj", "model.layers.4.mlp.experts.103.down_proj", "model.layers.4.mlp.experts.104.down_proj", "model.layers.4.mlp.experts.105.down_proj", "model.layers.4.mlp.experts.106.down_proj", "model.layers.4.mlp.experts.107.down_proj", "model.layers.4.mlp.experts.108.down_proj", "model.layers.4.mlp.experts.109.down_proj", "model.layers.4.mlp.experts.110.down_proj", "model.layers.4.mlp.experts.111.down_proj", "model.layers.4.mlp.experts.112.down_proj", "model.layers.4.mlp.experts.113.down_proj", "model.layers.4.mlp.experts.114.down_proj", "model.layers.4.mlp.experts.115.down_proj", "model.layers.4.mlp.experts.116.down_proj", "model.layers.4.mlp.experts.117.down_proj", "model.layers.4.mlp.experts.118.down_proj", "model.layers.4.mlp.experts.119.down_proj", "model.layers.4.mlp.experts.120.down_proj", "model.layers.4.mlp.experts.121.down_proj", "model.layers.4.mlp.experts.122.down_proj", "model.layers.4.mlp.experts.123.down_proj", "model.layers.4.mlp.experts.124.down_proj", "model.layers.4.mlp.experts.125.down_proj", "model.layers.4.mlp.experts.126.down_proj", "model.layers.4.mlp.experts.127.down_proj", "model.layers.4.mlp.experts.128.down_proj", "model.layers.4.mlp.experts.129.down_proj", "model.layers.4.mlp.experts.130.down_proj", "model.layers.4.mlp.experts.131.down_proj", "model.layers.4.mlp.experts.132.down_proj", "model.layers.4.mlp.experts.133.down_proj", "model.layers.4.mlp.experts.134.down_proj", "model.layers.4.mlp.experts.135.down_proj", "model.layers.4.mlp.experts.136.down_proj", "model.layers.4.mlp.experts.137.down_proj", "model.layers.4.mlp.experts.138.down_proj", "model.layers.4.mlp.experts.139.down_proj", "model.layers.4.mlp.experts.140.down_proj", "model.layers.4.mlp.experts.141.down_proj", "model.layers.4.mlp.experts.142.down_proj", "model.layers.4.mlp.experts.143.down_proj", "model.layers.4.mlp.experts.144.down_proj", "model.layers.4.mlp.experts.145.down_proj", "model.layers.4.mlp.experts.146.down_proj", "model.layers.4.mlp.experts.147.down_proj", "model.layers.4.mlp.experts.148.down_proj", "model.layers.4.mlp.experts.149.down_proj", "model.layers.4.mlp.experts.150.down_proj", "model.layers.4.mlp.experts.151.down_proj", "model.layers.4.mlp.experts.152.down_proj", "model.layers.4.mlp.experts.153.down_proj", "model.layers.4.mlp.experts.154.down_proj", "model.layers.4.mlp.experts.155.down_proj", "model.layers.4.mlp.experts.156.down_proj", "model.layers.4.mlp.experts.157.down_proj", "model.layers.4.mlp.experts.158.down_proj", "model.layers.4.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.5593578144906564e-05, "dbits": 1258291200 }, { "dkld": -1.995167694985797e-05, "dbits": 2516582400 } ] }, { "idx": 27, "layers": [ "model.layers.5.self_attn.q_proj" ], "candidates": [ { "dkld": -3.822403959929943e-05, "dbits": 62914560 }, { "dkld": -6.195344030856392e-06, "dbits": 125829120 } ] }, { "idx": 28, "layers": [ "model.layers.5.self_attn.k_proj", "model.layers.5.self_attn.v_proj" ], "candidates": [ { "dkld": -3.950998652726273e-05, "dbits": 10485760 }, { "dkld": -7.169949822126778e-06, "dbits": 20971520 } ] }, { "idx": 29, "layers": [ "model.layers.5.self_attn.o_proj" ], "candidates": [ { "dkld": -4.858840256929259e-05, "dbits": 62914560 }, { "dkld": -6.489378865808144e-05, "dbits": 125829120 } ] }, { "idx": 30, "layers": [ "model.layers.5.mlp.shared_experts.gate_proj", "model.layers.5.mlp.shared_experts.up_proj", "model.layers.5.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.270580105483532e-05, "dbits": 23592960 }, { "dkld": 3.3957930281759e-05, "dbits": 47185920 } ] }, { "idx": 31, "layers": [ "model.layers.5.mlp.experts.0.gate_proj", "model.layers.5.mlp.experts.1.gate_proj", "model.layers.5.mlp.experts.2.gate_proj", "model.layers.5.mlp.experts.3.gate_proj", "model.layers.5.mlp.experts.4.gate_proj", "model.layers.5.mlp.experts.5.gate_proj", "model.layers.5.mlp.experts.6.gate_proj", "model.layers.5.mlp.experts.7.gate_proj", "model.layers.5.mlp.experts.8.gate_proj", "model.layers.5.mlp.experts.9.gate_proj", "model.layers.5.mlp.experts.10.gate_proj", "model.layers.5.mlp.experts.11.gate_proj", "model.layers.5.mlp.experts.12.gate_proj", "model.layers.5.mlp.experts.13.gate_proj", "model.layers.5.mlp.experts.14.gate_proj", "model.layers.5.mlp.experts.15.gate_proj", "model.layers.5.mlp.experts.16.gate_proj", "model.layers.5.mlp.experts.17.gate_proj", "model.layers.5.mlp.experts.18.gate_proj", "model.layers.5.mlp.experts.19.gate_proj", "model.layers.5.mlp.experts.20.gate_proj", "model.layers.5.mlp.experts.21.gate_proj", "model.layers.5.mlp.experts.22.gate_proj", "model.layers.5.mlp.experts.23.gate_proj", "model.layers.5.mlp.experts.24.gate_proj", "model.layers.5.mlp.experts.25.gate_proj", "model.layers.5.mlp.experts.26.gate_proj", "model.layers.5.mlp.experts.27.gate_proj", "model.layers.5.mlp.experts.28.gate_proj", "model.layers.5.mlp.experts.29.gate_proj", "model.layers.5.mlp.experts.30.gate_proj", "model.layers.5.mlp.experts.31.gate_proj", "model.layers.5.mlp.experts.32.gate_proj", "model.layers.5.mlp.experts.33.gate_proj", "model.layers.5.mlp.experts.34.gate_proj", "model.layers.5.mlp.experts.35.gate_proj", "model.layers.5.mlp.experts.36.gate_proj", "model.layers.5.mlp.experts.37.gate_proj", "model.layers.5.mlp.experts.38.gate_proj", "model.layers.5.mlp.experts.39.gate_proj", "model.layers.5.mlp.experts.40.gate_proj", "model.layers.5.mlp.experts.41.gate_proj", "model.layers.5.mlp.experts.42.gate_proj", "model.layers.5.mlp.experts.43.gate_proj", "model.layers.5.mlp.experts.44.gate_proj", "model.layers.5.mlp.experts.45.gate_proj", "model.layers.5.mlp.experts.46.gate_proj", "model.layers.5.mlp.experts.47.gate_proj", "model.layers.5.mlp.experts.48.gate_proj", "model.layers.5.mlp.experts.49.gate_proj", "model.layers.5.mlp.experts.50.gate_proj", "model.layers.5.mlp.experts.51.gate_proj", "model.layers.5.mlp.experts.52.gate_proj", "model.layers.5.mlp.experts.53.gate_proj", "model.layers.5.mlp.experts.54.gate_proj", "model.layers.5.mlp.experts.55.gate_proj", "model.layers.5.mlp.experts.56.gate_proj", "model.layers.5.mlp.experts.57.gate_proj", "model.layers.5.mlp.experts.58.gate_proj", "model.layers.5.mlp.experts.59.gate_proj", "model.layers.5.mlp.experts.60.gate_proj", "model.layers.5.mlp.experts.61.gate_proj", "model.layers.5.mlp.experts.62.gate_proj", "model.layers.5.mlp.experts.63.gate_proj", "model.layers.5.mlp.experts.64.gate_proj", "model.layers.5.mlp.experts.65.gate_proj", "model.layers.5.mlp.experts.66.gate_proj", "model.layers.5.mlp.experts.67.gate_proj", "model.layers.5.mlp.experts.68.gate_proj", "model.layers.5.mlp.experts.69.gate_proj", "model.layers.5.mlp.experts.70.gate_proj", "model.layers.5.mlp.experts.71.gate_proj", "model.layers.5.mlp.experts.72.gate_proj", "model.layers.5.mlp.experts.73.gate_proj", "model.layers.5.mlp.experts.74.gate_proj", "model.layers.5.mlp.experts.75.gate_proj", "model.layers.5.mlp.experts.76.gate_proj", "model.layers.5.mlp.experts.77.gate_proj", "model.layers.5.mlp.experts.78.gate_proj", "model.layers.5.mlp.experts.79.gate_proj", "model.layers.5.mlp.experts.80.gate_proj", "model.layers.5.mlp.experts.81.gate_proj", "model.layers.5.mlp.experts.82.gate_proj", "model.layers.5.mlp.experts.83.gate_proj", "model.layers.5.mlp.experts.84.gate_proj", "model.layers.5.mlp.experts.85.gate_proj", "model.layers.5.mlp.experts.86.gate_proj", "model.layers.5.mlp.experts.87.gate_proj", "model.layers.5.mlp.experts.88.gate_proj", "model.layers.5.mlp.experts.89.gate_proj", "model.layers.5.mlp.experts.90.gate_proj", "model.layers.5.mlp.experts.91.gate_proj", "model.layers.5.mlp.experts.92.gate_proj", "model.layers.5.mlp.experts.93.gate_proj", "model.layers.5.mlp.experts.94.gate_proj", "model.layers.5.mlp.experts.95.gate_proj", "model.layers.5.mlp.experts.96.gate_proj", "model.layers.5.mlp.experts.97.gate_proj", "model.layers.5.mlp.experts.98.gate_proj", "model.layers.5.mlp.experts.99.gate_proj", "model.layers.5.mlp.experts.100.gate_proj", "model.layers.5.mlp.experts.101.gate_proj", "model.layers.5.mlp.experts.102.gate_proj", "model.layers.5.mlp.experts.103.gate_proj", "model.layers.5.mlp.experts.104.gate_proj", "model.layers.5.mlp.experts.105.gate_proj", "model.layers.5.mlp.experts.106.gate_proj", "model.layers.5.mlp.experts.107.gate_proj", "model.layers.5.mlp.experts.108.gate_proj", "model.layers.5.mlp.experts.109.gate_proj", "model.layers.5.mlp.experts.110.gate_proj", "model.layers.5.mlp.experts.111.gate_proj", "model.layers.5.mlp.experts.112.gate_proj", "model.layers.5.mlp.experts.113.gate_proj", "model.layers.5.mlp.experts.114.gate_proj", "model.layers.5.mlp.experts.115.gate_proj", "model.layers.5.mlp.experts.116.gate_proj", "model.layers.5.mlp.experts.117.gate_proj", "model.layers.5.mlp.experts.118.gate_proj", "model.layers.5.mlp.experts.119.gate_proj", "model.layers.5.mlp.experts.120.gate_proj", "model.layers.5.mlp.experts.121.gate_proj", "model.layers.5.mlp.experts.122.gate_proj", "model.layers.5.mlp.experts.123.gate_proj", "model.layers.5.mlp.experts.124.gate_proj", "model.layers.5.mlp.experts.125.gate_proj", "model.layers.5.mlp.experts.126.gate_proj", "model.layers.5.mlp.experts.127.gate_proj", "model.layers.5.mlp.experts.128.gate_proj", "model.layers.5.mlp.experts.129.gate_proj", "model.layers.5.mlp.experts.130.gate_proj", "model.layers.5.mlp.experts.131.gate_proj", "model.layers.5.mlp.experts.132.gate_proj", "model.layers.5.mlp.experts.133.gate_proj", "model.layers.5.mlp.experts.134.gate_proj", "model.layers.5.mlp.experts.135.gate_proj", "model.layers.5.mlp.experts.136.gate_proj", "model.layers.5.mlp.experts.137.gate_proj", "model.layers.5.mlp.experts.138.gate_proj", "model.layers.5.mlp.experts.139.gate_proj", "model.layers.5.mlp.experts.140.gate_proj", "model.layers.5.mlp.experts.141.gate_proj", "model.layers.5.mlp.experts.142.gate_proj", "model.layers.5.mlp.experts.143.gate_proj", "model.layers.5.mlp.experts.144.gate_proj", "model.layers.5.mlp.experts.145.gate_proj", "model.layers.5.mlp.experts.146.gate_proj", "model.layers.5.mlp.experts.147.gate_proj", "model.layers.5.mlp.experts.148.gate_proj", "model.layers.5.mlp.experts.149.gate_proj", "model.layers.5.mlp.experts.150.gate_proj", "model.layers.5.mlp.experts.151.gate_proj", "model.layers.5.mlp.experts.152.gate_proj", "model.layers.5.mlp.experts.153.gate_proj", "model.layers.5.mlp.experts.154.gate_proj", "model.layers.5.mlp.experts.155.gate_proj", "model.layers.5.mlp.experts.156.gate_proj", "model.layers.5.mlp.experts.157.gate_proj", "model.layers.5.mlp.experts.158.gate_proj", "model.layers.5.mlp.experts.159.gate_proj", "model.layers.5.mlp.experts.0.up_proj", "model.layers.5.mlp.experts.1.up_proj", "model.layers.5.mlp.experts.2.up_proj", "model.layers.5.mlp.experts.3.up_proj", "model.layers.5.mlp.experts.4.up_proj", "model.layers.5.mlp.experts.5.up_proj", "model.layers.5.mlp.experts.6.up_proj", "model.layers.5.mlp.experts.7.up_proj", "model.layers.5.mlp.experts.8.up_proj", "model.layers.5.mlp.experts.9.up_proj", "model.layers.5.mlp.experts.10.up_proj", "model.layers.5.mlp.experts.11.up_proj", "model.layers.5.mlp.experts.12.up_proj", "model.layers.5.mlp.experts.13.up_proj", "model.layers.5.mlp.experts.14.up_proj", "model.layers.5.mlp.experts.15.up_proj", "model.layers.5.mlp.experts.16.up_proj", "model.layers.5.mlp.experts.17.up_proj", "model.layers.5.mlp.experts.18.up_proj", "model.layers.5.mlp.experts.19.up_proj", "model.layers.5.mlp.experts.20.up_proj", "model.layers.5.mlp.experts.21.up_proj", "model.layers.5.mlp.experts.22.up_proj", "model.layers.5.mlp.experts.23.up_proj", "model.layers.5.mlp.experts.24.up_proj", "model.layers.5.mlp.experts.25.up_proj", "model.layers.5.mlp.experts.26.up_proj", "model.layers.5.mlp.experts.27.up_proj", "model.layers.5.mlp.experts.28.up_proj", "model.layers.5.mlp.experts.29.up_proj", "model.layers.5.mlp.experts.30.up_proj", "model.layers.5.mlp.experts.31.up_proj", "model.layers.5.mlp.experts.32.up_proj", "model.layers.5.mlp.experts.33.up_proj", "model.layers.5.mlp.experts.34.up_proj", "model.layers.5.mlp.experts.35.up_proj", "model.layers.5.mlp.experts.36.up_proj", "model.layers.5.mlp.experts.37.up_proj", "model.layers.5.mlp.experts.38.up_proj", "model.layers.5.mlp.experts.39.up_proj", "model.layers.5.mlp.experts.40.up_proj", "model.layers.5.mlp.experts.41.up_proj", "model.layers.5.mlp.experts.42.up_proj", "model.layers.5.mlp.experts.43.up_proj", "model.layers.5.mlp.experts.44.up_proj", "model.layers.5.mlp.experts.45.up_proj", "model.layers.5.mlp.experts.46.up_proj", "model.layers.5.mlp.experts.47.up_proj", "model.layers.5.mlp.experts.48.up_proj", "model.layers.5.mlp.experts.49.up_proj", "model.layers.5.mlp.experts.50.up_proj", "model.layers.5.mlp.experts.51.up_proj", "model.layers.5.mlp.experts.52.up_proj", "model.layers.5.mlp.experts.53.up_proj", "model.layers.5.mlp.experts.54.up_proj", "model.layers.5.mlp.experts.55.up_proj", "model.layers.5.mlp.experts.56.up_proj", "model.layers.5.mlp.experts.57.up_proj", "model.layers.5.mlp.experts.58.up_proj", "model.layers.5.mlp.experts.59.up_proj", "model.layers.5.mlp.experts.60.up_proj", "model.layers.5.mlp.experts.61.up_proj", "model.layers.5.mlp.experts.62.up_proj", "model.layers.5.mlp.experts.63.up_proj", "model.layers.5.mlp.experts.64.up_proj", "model.layers.5.mlp.experts.65.up_proj", "model.layers.5.mlp.experts.66.up_proj", "model.layers.5.mlp.experts.67.up_proj", "model.layers.5.mlp.experts.68.up_proj", "model.layers.5.mlp.experts.69.up_proj", "model.layers.5.mlp.experts.70.up_proj", "model.layers.5.mlp.experts.71.up_proj", "model.layers.5.mlp.experts.72.up_proj", "model.layers.5.mlp.experts.73.up_proj", "model.layers.5.mlp.experts.74.up_proj", "model.layers.5.mlp.experts.75.up_proj", "model.layers.5.mlp.experts.76.up_proj", "model.layers.5.mlp.experts.77.up_proj", "model.layers.5.mlp.experts.78.up_proj", "model.layers.5.mlp.experts.79.up_proj", "model.layers.5.mlp.experts.80.up_proj", "model.layers.5.mlp.experts.81.up_proj", "model.layers.5.mlp.experts.82.up_proj", "model.layers.5.mlp.experts.83.up_proj", "model.layers.5.mlp.experts.84.up_proj", "model.layers.5.mlp.experts.85.up_proj", "model.layers.5.mlp.experts.86.up_proj", "model.layers.5.mlp.experts.87.up_proj", "model.layers.5.mlp.experts.88.up_proj", "model.layers.5.mlp.experts.89.up_proj", "model.layers.5.mlp.experts.90.up_proj", "model.layers.5.mlp.experts.91.up_proj", "model.layers.5.mlp.experts.92.up_proj", "model.layers.5.mlp.experts.93.up_proj", "model.layers.5.mlp.experts.94.up_proj", "model.layers.5.mlp.experts.95.up_proj", "model.layers.5.mlp.experts.96.up_proj", "model.layers.5.mlp.experts.97.up_proj", "model.layers.5.mlp.experts.98.up_proj", "model.layers.5.mlp.experts.99.up_proj", "model.layers.5.mlp.experts.100.up_proj", "model.layers.5.mlp.experts.101.up_proj", "model.layers.5.mlp.experts.102.up_proj", "model.layers.5.mlp.experts.103.up_proj", "model.layers.5.mlp.experts.104.up_proj", "model.layers.5.mlp.experts.105.up_proj", "model.layers.5.mlp.experts.106.up_proj", "model.layers.5.mlp.experts.107.up_proj", "model.layers.5.mlp.experts.108.up_proj", "model.layers.5.mlp.experts.109.up_proj", "model.layers.5.mlp.experts.110.up_proj", "model.layers.5.mlp.experts.111.up_proj", "model.layers.5.mlp.experts.112.up_proj", "model.layers.5.mlp.experts.113.up_proj", "model.layers.5.mlp.experts.114.up_proj", "model.layers.5.mlp.experts.115.up_proj", "model.layers.5.mlp.experts.116.up_proj", "model.layers.5.mlp.experts.117.up_proj", "model.layers.5.mlp.experts.118.up_proj", "model.layers.5.mlp.experts.119.up_proj", "model.layers.5.mlp.experts.120.up_proj", "model.layers.5.mlp.experts.121.up_proj", "model.layers.5.mlp.experts.122.up_proj", "model.layers.5.mlp.experts.123.up_proj", "model.layers.5.mlp.experts.124.up_proj", "model.layers.5.mlp.experts.125.up_proj", "model.layers.5.mlp.experts.126.up_proj", "model.layers.5.mlp.experts.127.up_proj", "model.layers.5.mlp.experts.128.up_proj", "model.layers.5.mlp.experts.129.up_proj", "model.layers.5.mlp.experts.130.up_proj", "model.layers.5.mlp.experts.131.up_proj", "model.layers.5.mlp.experts.132.up_proj", "model.layers.5.mlp.experts.133.up_proj", "model.layers.5.mlp.experts.134.up_proj", "model.layers.5.mlp.experts.135.up_proj", "model.layers.5.mlp.experts.136.up_proj", "model.layers.5.mlp.experts.137.up_proj", "model.layers.5.mlp.experts.138.up_proj", "model.layers.5.mlp.experts.139.up_proj", "model.layers.5.mlp.experts.140.up_proj", "model.layers.5.mlp.experts.141.up_proj", "model.layers.5.mlp.experts.142.up_proj", "model.layers.5.mlp.experts.143.up_proj", "model.layers.5.mlp.experts.144.up_proj", "model.layers.5.mlp.experts.145.up_proj", "model.layers.5.mlp.experts.146.up_proj", "model.layers.5.mlp.experts.147.up_proj", "model.layers.5.mlp.experts.148.up_proj", "model.layers.5.mlp.experts.149.up_proj", "model.layers.5.mlp.experts.150.up_proj", "model.layers.5.mlp.experts.151.up_proj", "model.layers.5.mlp.experts.152.up_proj", "model.layers.5.mlp.experts.153.up_proj", "model.layers.5.mlp.experts.154.up_proj", "model.layers.5.mlp.experts.155.up_proj", "model.layers.5.mlp.experts.156.up_proj", "model.layers.5.mlp.experts.157.up_proj", "model.layers.5.mlp.experts.158.up_proj", "model.layers.5.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -6.6453497856854e-05, "dbits": 2516582400 }, { "dkld": -2.5006826035678387e-05, "dbits": 5033164800 } ] }, { "idx": 32, "layers": [ "model.layers.5.mlp.experts.0.down_proj", "model.layers.5.mlp.experts.1.down_proj", "model.layers.5.mlp.experts.2.down_proj", "model.layers.5.mlp.experts.3.down_proj", "model.layers.5.mlp.experts.4.down_proj", "model.layers.5.mlp.experts.5.down_proj", "model.layers.5.mlp.experts.6.down_proj", "model.layers.5.mlp.experts.7.down_proj", "model.layers.5.mlp.experts.8.down_proj", "model.layers.5.mlp.experts.9.down_proj", "model.layers.5.mlp.experts.10.down_proj", "model.layers.5.mlp.experts.11.down_proj", "model.layers.5.mlp.experts.12.down_proj", "model.layers.5.mlp.experts.13.down_proj", "model.layers.5.mlp.experts.14.down_proj", "model.layers.5.mlp.experts.15.down_proj", "model.layers.5.mlp.experts.16.down_proj", "model.layers.5.mlp.experts.17.down_proj", "model.layers.5.mlp.experts.18.down_proj", "model.layers.5.mlp.experts.19.down_proj", "model.layers.5.mlp.experts.20.down_proj", "model.layers.5.mlp.experts.21.down_proj", "model.layers.5.mlp.experts.22.down_proj", "model.layers.5.mlp.experts.23.down_proj", "model.layers.5.mlp.experts.24.down_proj", "model.layers.5.mlp.experts.25.down_proj", "model.layers.5.mlp.experts.26.down_proj", "model.layers.5.mlp.experts.27.down_proj", "model.layers.5.mlp.experts.28.down_proj", "model.layers.5.mlp.experts.29.down_proj", "model.layers.5.mlp.experts.30.down_proj", "model.layers.5.mlp.experts.31.down_proj", "model.layers.5.mlp.experts.32.down_proj", "model.layers.5.mlp.experts.33.down_proj", "model.layers.5.mlp.experts.34.down_proj", "model.layers.5.mlp.experts.35.down_proj", "model.layers.5.mlp.experts.36.down_proj", "model.layers.5.mlp.experts.37.down_proj", "model.layers.5.mlp.experts.38.down_proj", "model.layers.5.mlp.experts.39.down_proj", "model.layers.5.mlp.experts.40.down_proj", "model.layers.5.mlp.experts.41.down_proj", "model.layers.5.mlp.experts.42.down_proj", "model.layers.5.mlp.experts.43.down_proj", "model.layers.5.mlp.experts.44.down_proj", "model.layers.5.mlp.experts.45.down_proj", "model.layers.5.mlp.experts.46.down_proj", "model.layers.5.mlp.experts.47.down_proj", "model.layers.5.mlp.experts.48.down_proj", "model.layers.5.mlp.experts.49.down_proj", "model.layers.5.mlp.experts.50.down_proj", "model.layers.5.mlp.experts.51.down_proj", "model.layers.5.mlp.experts.52.down_proj", "model.layers.5.mlp.experts.53.down_proj", "model.layers.5.mlp.experts.54.down_proj", "model.layers.5.mlp.experts.55.down_proj", "model.layers.5.mlp.experts.56.down_proj", "model.layers.5.mlp.experts.57.down_proj", "model.layers.5.mlp.experts.58.down_proj", "model.layers.5.mlp.experts.59.down_proj", "model.layers.5.mlp.experts.60.down_proj", "model.layers.5.mlp.experts.61.down_proj", "model.layers.5.mlp.experts.62.down_proj", "model.layers.5.mlp.experts.63.down_proj", "model.layers.5.mlp.experts.64.down_proj", "model.layers.5.mlp.experts.65.down_proj", "model.layers.5.mlp.experts.66.down_proj", "model.layers.5.mlp.experts.67.down_proj", "model.layers.5.mlp.experts.68.down_proj", "model.layers.5.mlp.experts.69.down_proj", "model.layers.5.mlp.experts.70.down_proj", "model.layers.5.mlp.experts.71.down_proj", "model.layers.5.mlp.experts.72.down_proj", "model.layers.5.mlp.experts.73.down_proj", "model.layers.5.mlp.experts.74.down_proj", "model.layers.5.mlp.experts.75.down_proj", "model.layers.5.mlp.experts.76.down_proj", "model.layers.5.mlp.experts.77.down_proj", "model.layers.5.mlp.experts.78.down_proj", "model.layers.5.mlp.experts.79.down_proj", "model.layers.5.mlp.experts.80.down_proj", "model.layers.5.mlp.experts.81.down_proj", "model.layers.5.mlp.experts.82.down_proj", "model.layers.5.mlp.experts.83.down_proj", "model.layers.5.mlp.experts.84.down_proj", "model.layers.5.mlp.experts.85.down_proj", "model.layers.5.mlp.experts.86.down_proj", "model.layers.5.mlp.experts.87.down_proj", "model.layers.5.mlp.experts.88.down_proj", "model.layers.5.mlp.experts.89.down_proj", "model.layers.5.mlp.experts.90.down_proj", "model.layers.5.mlp.experts.91.down_proj", "model.layers.5.mlp.experts.92.down_proj", "model.layers.5.mlp.experts.93.down_proj", "model.layers.5.mlp.experts.94.down_proj", "model.layers.5.mlp.experts.95.down_proj", "model.layers.5.mlp.experts.96.down_proj", "model.layers.5.mlp.experts.97.down_proj", "model.layers.5.mlp.experts.98.down_proj", "model.layers.5.mlp.experts.99.down_proj", "model.layers.5.mlp.experts.100.down_proj", "model.layers.5.mlp.experts.101.down_proj", "model.layers.5.mlp.experts.102.down_proj", "model.layers.5.mlp.experts.103.down_proj", "model.layers.5.mlp.experts.104.down_proj", "model.layers.5.mlp.experts.105.down_proj", "model.layers.5.mlp.experts.106.down_proj", "model.layers.5.mlp.experts.107.down_proj", "model.layers.5.mlp.experts.108.down_proj", "model.layers.5.mlp.experts.109.down_proj", "model.layers.5.mlp.experts.110.down_proj", "model.layers.5.mlp.experts.111.down_proj", "model.layers.5.mlp.experts.112.down_proj", "model.layers.5.mlp.experts.113.down_proj", "model.layers.5.mlp.experts.114.down_proj", "model.layers.5.mlp.experts.115.down_proj", "model.layers.5.mlp.experts.116.down_proj", "model.layers.5.mlp.experts.117.down_proj", "model.layers.5.mlp.experts.118.down_proj", "model.layers.5.mlp.experts.119.down_proj", "model.layers.5.mlp.experts.120.down_proj", "model.layers.5.mlp.experts.121.down_proj", "model.layers.5.mlp.experts.122.down_proj", "model.layers.5.mlp.experts.123.down_proj", "model.layers.5.mlp.experts.124.down_proj", "model.layers.5.mlp.experts.125.down_proj", "model.layers.5.mlp.experts.126.down_proj", "model.layers.5.mlp.experts.127.down_proj", "model.layers.5.mlp.experts.128.down_proj", "model.layers.5.mlp.experts.129.down_proj", "model.layers.5.mlp.experts.130.down_proj", "model.layers.5.mlp.experts.131.down_proj", "model.layers.5.mlp.experts.132.down_proj", "model.layers.5.mlp.experts.133.down_proj", "model.layers.5.mlp.experts.134.down_proj", "model.layers.5.mlp.experts.135.down_proj", "model.layers.5.mlp.experts.136.down_proj", "model.layers.5.mlp.experts.137.down_proj", "model.layers.5.mlp.experts.138.down_proj", "model.layers.5.mlp.experts.139.down_proj", "model.layers.5.mlp.experts.140.down_proj", "model.layers.5.mlp.experts.141.down_proj", "model.layers.5.mlp.experts.142.down_proj", "model.layers.5.mlp.experts.143.down_proj", "model.layers.5.mlp.experts.144.down_proj", "model.layers.5.mlp.experts.145.down_proj", "model.layers.5.mlp.experts.146.down_proj", "model.layers.5.mlp.experts.147.down_proj", "model.layers.5.mlp.experts.148.down_proj", "model.layers.5.mlp.experts.149.down_proj", "model.layers.5.mlp.experts.150.down_proj", "model.layers.5.mlp.experts.151.down_proj", "model.layers.5.mlp.experts.152.down_proj", "model.layers.5.mlp.experts.153.down_proj", "model.layers.5.mlp.experts.154.down_proj", "model.layers.5.mlp.experts.155.down_proj", "model.layers.5.mlp.experts.156.down_proj", "model.layers.5.mlp.experts.157.down_proj", "model.layers.5.mlp.experts.158.down_proj", "model.layers.5.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.9448426105080994e-05, "dbits": 1258291200 }, { "dkld": -0.00010573484469205037, "dbits": 2516582400 } ] }, { "idx": 33, "layers": [ "model.layers.6.self_attn.q_proj" ], "candidates": [ { "dkld": 4.071928560734836e-06, "dbits": 62914560 }, { "dkld": -2.0664557814596696e-05, "dbits": 125829120 } ] }, { "idx": 34, "layers": [ "model.layers.6.self_attn.k_proj", "model.layers.6.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0001267901156097647, "dbits": 10485760 }, { "dkld": -7.202336564660072e-05, "dbits": 20971520 } ] }, { "idx": 35, "layers": [ "model.layers.6.self_attn.o_proj" ], "candidates": [ { "dkld": 1.0191323235632377e-05, "dbits": 62914560 }, { "dkld": -5.016429349780083e-05, "dbits": 125829120 } ] }, { "idx": 36, "layers": [ "model.layers.6.mlp.shared_experts.gate_proj", "model.layers.6.mlp.shared_experts.up_proj", "model.layers.6.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00011472126934677224, "dbits": 23592960 }, { "dkld": -9.235965553671018e-05, "dbits": 47185920 } ] }, { "idx": 37, "layers": [ "model.layers.6.mlp.experts.0.gate_proj", "model.layers.6.mlp.experts.1.gate_proj", "model.layers.6.mlp.experts.2.gate_proj", "model.layers.6.mlp.experts.3.gate_proj", "model.layers.6.mlp.experts.4.gate_proj", "model.layers.6.mlp.experts.5.gate_proj", "model.layers.6.mlp.experts.6.gate_proj", "model.layers.6.mlp.experts.7.gate_proj", "model.layers.6.mlp.experts.8.gate_proj", "model.layers.6.mlp.experts.9.gate_proj", "model.layers.6.mlp.experts.10.gate_proj", "model.layers.6.mlp.experts.11.gate_proj", "model.layers.6.mlp.experts.12.gate_proj", "model.layers.6.mlp.experts.13.gate_proj", "model.layers.6.mlp.experts.14.gate_proj", "model.layers.6.mlp.experts.15.gate_proj", "model.layers.6.mlp.experts.16.gate_proj", "model.layers.6.mlp.experts.17.gate_proj", "model.layers.6.mlp.experts.18.gate_proj", "model.layers.6.mlp.experts.19.gate_proj", "model.layers.6.mlp.experts.20.gate_proj", "model.layers.6.mlp.experts.21.gate_proj", "model.layers.6.mlp.experts.22.gate_proj", "model.layers.6.mlp.experts.23.gate_proj", "model.layers.6.mlp.experts.24.gate_proj", "model.layers.6.mlp.experts.25.gate_proj", "model.layers.6.mlp.experts.26.gate_proj", "model.layers.6.mlp.experts.27.gate_proj", "model.layers.6.mlp.experts.28.gate_proj", "model.layers.6.mlp.experts.29.gate_proj", "model.layers.6.mlp.experts.30.gate_proj", "model.layers.6.mlp.experts.31.gate_proj", "model.layers.6.mlp.experts.32.gate_proj", "model.layers.6.mlp.experts.33.gate_proj", "model.layers.6.mlp.experts.34.gate_proj", "model.layers.6.mlp.experts.35.gate_proj", "model.layers.6.mlp.experts.36.gate_proj", "model.layers.6.mlp.experts.37.gate_proj", "model.layers.6.mlp.experts.38.gate_proj", "model.layers.6.mlp.experts.39.gate_proj", "model.layers.6.mlp.experts.40.gate_proj", "model.layers.6.mlp.experts.41.gate_proj", "model.layers.6.mlp.experts.42.gate_proj", "model.layers.6.mlp.experts.43.gate_proj", "model.layers.6.mlp.experts.44.gate_proj", "model.layers.6.mlp.experts.45.gate_proj", "model.layers.6.mlp.experts.46.gate_proj", "model.layers.6.mlp.experts.47.gate_proj", "model.layers.6.mlp.experts.48.gate_proj", "model.layers.6.mlp.experts.49.gate_proj", "model.layers.6.mlp.experts.50.gate_proj", "model.layers.6.mlp.experts.51.gate_proj", "model.layers.6.mlp.experts.52.gate_proj", "model.layers.6.mlp.experts.53.gate_proj", "model.layers.6.mlp.experts.54.gate_proj", "model.layers.6.mlp.experts.55.gate_proj", "model.layers.6.mlp.experts.56.gate_proj", "model.layers.6.mlp.experts.57.gate_proj", "model.layers.6.mlp.experts.58.gate_proj", "model.layers.6.mlp.experts.59.gate_proj", "model.layers.6.mlp.experts.60.gate_proj", "model.layers.6.mlp.experts.61.gate_proj", "model.layers.6.mlp.experts.62.gate_proj", "model.layers.6.mlp.experts.63.gate_proj", "model.layers.6.mlp.experts.64.gate_proj", "model.layers.6.mlp.experts.65.gate_proj", "model.layers.6.mlp.experts.66.gate_proj", "model.layers.6.mlp.experts.67.gate_proj", "model.layers.6.mlp.experts.68.gate_proj", "model.layers.6.mlp.experts.69.gate_proj", "model.layers.6.mlp.experts.70.gate_proj", "model.layers.6.mlp.experts.71.gate_proj", "model.layers.6.mlp.experts.72.gate_proj", "model.layers.6.mlp.experts.73.gate_proj", "model.layers.6.mlp.experts.74.gate_proj", "model.layers.6.mlp.experts.75.gate_proj", "model.layers.6.mlp.experts.76.gate_proj", "model.layers.6.mlp.experts.77.gate_proj", "model.layers.6.mlp.experts.78.gate_proj", "model.layers.6.mlp.experts.79.gate_proj", "model.layers.6.mlp.experts.80.gate_proj", "model.layers.6.mlp.experts.81.gate_proj", "model.layers.6.mlp.experts.82.gate_proj", "model.layers.6.mlp.experts.83.gate_proj", "model.layers.6.mlp.experts.84.gate_proj", "model.layers.6.mlp.experts.85.gate_proj", "model.layers.6.mlp.experts.86.gate_proj", "model.layers.6.mlp.experts.87.gate_proj", "model.layers.6.mlp.experts.88.gate_proj", "model.layers.6.mlp.experts.89.gate_proj", "model.layers.6.mlp.experts.90.gate_proj", "model.layers.6.mlp.experts.91.gate_proj", "model.layers.6.mlp.experts.92.gate_proj", "model.layers.6.mlp.experts.93.gate_proj", "model.layers.6.mlp.experts.94.gate_proj", "model.layers.6.mlp.experts.95.gate_proj", "model.layers.6.mlp.experts.96.gate_proj", "model.layers.6.mlp.experts.97.gate_proj", "model.layers.6.mlp.experts.98.gate_proj", "model.layers.6.mlp.experts.99.gate_proj", "model.layers.6.mlp.experts.100.gate_proj", "model.layers.6.mlp.experts.101.gate_proj", "model.layers.6.mlp.experts.102.gate_proj", "model.layers.6.mlp.experts.103.gate_proj", "model.layers.6.mlp.experts.104.gate_proj", "model.layers.6.mlp.experts.105.gate_proj", "model.layers.6.mlp.experts.106.gate_proj", "model.layers.6.mlp.experts.107.gate_proj", "model.layers.6.mlp.experts.108.gate_proj", "model.layers.6.mlp.experts.109.gate_proj", "model.layers.6.mlp.experts.110.gate_proj", "model.layers.6.mlp.experts.111.gate_proj", "model.layers.6.mlp.experts.112.gate_proj", "model.layers.6.mlp.experts.113.gate_proj", "model.layers.6.mlp.experts.114.gate_proj", "model.layers.6.mlp.experts.115.gate_proj", "model.layers.6.mlp.experts.116.gate_proj", "model.layers.6.mlp.experts.117.gate_proj", "model.layers.6.mlp.experts.118.gate_proj", "model.layers.6.mlp.experts.119.gate_proj", "model.layers.6.mlp.experts.120.gate_proj", "model.layers.6.mlp.experts.121.gate_proj", "model.layers.6.mlp.experts.122.gate_proj", "model.layers.6.mlp.experts.123.gate_proj", "model.layers.6.mlp.experts.124.gate_proj", "model.layers.6.mlp.experts.125.gate_proj", "model.layers.6.mlp.experts.126.gate_proj", "model.layers.6.mlp.experts.127.gate_proj", "model.layers.6.mlp.experts.128.gate_proj", "model.layers.6.mlp.experts.129.gate_proj", "model.layers.6.mlp.experts.130.gate_proj", "model.layers.6.mlp.experts.131.gate_proj", "model.layers.6.mlp.experts.132.gate_proj", "model.layers.6.mlp.experts.133.gate_proj", "model.layers.6.mlp.experts.134.gate_proj", "model.layers.6.mlp.experts.135.gate_proj", "model.layers.6.mlp.experts.136.gate_proj", "model.layers.6.mlp.experts.137.gate_proj", "model.layers.6.mlp.experts.138.gate_proj", "model.layers.6.mlp.experts.139.gate_proj", "model.layers.6.mlp.experts.140.gate_proj", "model.layers.6.mlp.experts.141.gate_proj", "model.layers.6.mlp.experts.142.gate_proj", "model.layers.6.mlp.experts.143.gate_proj", "model.layers.6.mlp.experts.144.gate_proj", "model.layers.6.mlp.experts.145.gate_proj", "model.layers.6.mlp.experts.146.gate_proj", "model.layers.6.mlp.experts.147.gate_proj", "model.layers.6.mlp.experts.148.gate_proj", "model.layers.6.mlp.experts.149.gate_proj", "model.layers.6.mlp.experts.150.gate_proj", "model.layers.6.mlp.experts.151.gate_proj", "model.layers.6.mlp.experts.152.gate_proj", "model.layers.6.mlp.experts.153.gate_proj", "model.layers.6.mlp.experts.154.gate_proj", "model.layers.6.mlp.experts.155.gate_proj", "model.layers.6.mlp.experts.156.gate_proj", "model.layers.6.mlp.experts.157.gate_proj", "model.layers.6.mlp.experts.158.gate_proj", "model.layers.6.mlp.experts.159.gate_proj", "model.layers.6.mlp.experts.0.up_proj", "model.layers.6.mlp.experts.1.up_proj", "model.layers.6.mlp.experts.2.up_proj", "model.layers.6.mlp.experts.3.up_proj", "model.layers.6.mlp.experts.4.up_proj", "model.layers.6.mlp.experts.5.up_proj", "model.layers.6.mlp.experts.6.up_proj", "model.layers.6.mlp.experts.7.up_proj", "model.layers.6.mlp.experts.8.up_proj", "model.layers.6.mlp.experts.9.up_proj", "model.layers.6.mlp.experts.10.up_proj", "model.layers.6.mlp.experts.11.up_proj", "model.layers.6.mlp.experts.12.up_proj", "model.layers.6.mlp.experts.13.up_proj", "model.layers.6.mlp.experts.14.up_proj", "model.layers.6.mlp.experts.15.up_proj", "model.layers.6.mlp.experts.16.up_proj", "model.layers.6.mlp.experts.17.up_proj", "model.layers.6.mlp.experts.18.up_proj", "model.layers.6.mlp.experts.19.up_proj", "model.layers.6.mlp.experts.20.up_proj", "model.layers.6.mlp.experts.21.up_proj", "model.layers.6.mlp.experts.22.up_proj", "model.layers.6.mlp.experts.23.up_proj", "model.layers.6.mlp.experts.24.up_proj", "model.layers.6.mlp.experts.25.up_proj", "model.layers.6.mlp.experts.26.up_proj", "model.layers.6.mlp.experts.27.up_proj", "model.layers.6.mlp.experts.28.up_proj", "model.layers.6.mlp.experts.29.up_proj", "model.layers.6.mlp.experts.30.up_proj", "model.layers.6.mlp.experts.31.up_proj", "model.layers.6.mlp.experts.32.up_proj", "model.layers.6.mlp.experts.33.up_proj", "model.layers.6.mlp.experts.34.up_proj", "model.layers.6.mlp.experts.35.up_proj", "model.layers.6.mlp.experts.36.up_proj", "model.layers.6.mlp.experts.37.up_proj", "model.layers.6.mlp.experts.38.up_proj", "model.layers.6.mlp.experts.39.up_proj", "model.layers.6.mlp.experts.40.up_proj", "model.layers.6.mlp.experts.41.up_proj", "model.layers.6.mlp.experts.42.up_proj", "model.layers.6.mlp.experts.43.up_proj", "model.layers.6.mlp.experts.44.up_proj", "model.layers.6.mlp.experts.45.up_proj", "model.layers.6.mlp.experts.46.up_proj", "model.layers.6.mlp.experts.47.up_proj", "model.layers.6.mlp.experts.48.up_proj", "model.layers.6.mlp.experts.49.up_proj", "model.layers.6.mlp.experts.50.up_proj", "model.layers.6.mlp.experts.51.up_proj", "model.layers.6.mlp.experts.52.up_proj", "model.layers.6.mlp.experts.53.up_proj", "model.layers.6.mlp.experts.54.up_proj", "model.layers.6.mlp.experts.55.up_proj", "model.layers.6.mlp.experts.56.up_proj", "model.layers.6.mlp.experts.57.up_proj", "model.layers.6.mlp.experts.58.up_proj", "model.layers.6.mlp.experts.59.up_proj", "model.layers.6.mlp.experts.60.up_proj", "model.layers.6.mlp.experts.61.up_proj", "model.layers.6.mlp.experts.62.up_proj", "model.layers.6.mlp.experts.63.up_proj", "model.layers.6.mlp.experts.64.up_proj", "model.layers.6.mlp.experts.65.up_proj", "model.layers.6.mlp.experts.66.up_proj", "model.layers.6.mlp.experts.67.up_proj", "model.layers.6.mlp.experts.68.up_proj", "model.layers.6.mlp.experts.69.up_proj", "model.layers.6.mlp.experts.70.up_proj", "model.layers.6.mlp.experts.71.up_proj", "model.layers.6.mlp.experts.72.up_proj", "model.layers.6.mlp.experts.73.up_proj", "model.layers.6.mlp.experts.74.up_proj", "model.layers.6.mlp.experts.75.up_proj", "model.layers.6.mlp.experts.76.up_proj", "model.layers.6.mlp.experts.77.up_proj", "model.layers.6.mlp.experts.78.up_proj", "model.layers.6.mlp.experts.79.up_proj", "model.layers.6.mlp.experts.80.up_proj", "model.layers.6.mlp.experts.81.up_proj", "model.layers.6.mlp.experts.82.up_proj", "model.layers.6.mlp.experts.83.up_proj", "model.layers.6.mlp.experts.84.up_proj", "model.layers.6.mlp.experts.85.up_proj", "model.layers.6.mlp.experts.86.up_proj", "model.layers.6.mlp.experts.87.up_proj", "model.layers.6.mlp.experts.88.up_proj", "model.layers.6.mlp.experts.89.up_proj", "model.layers.6.mlp.experts.90.up_proj", "model.layers.6.mlp.experts.91.up_proj", "model.layers.6.mlp.experts.92.up_proj", "model.layers.6.mlp.experts.93.up_proj", "model.layers.6.mlp.experts.94.up_proj", "model.layers.6.mlp.experts.95.up_proj", "model.layers.6.mlp.experts.96.up_proj", "model.layers.6.mlp.experts.97.up_proj", "model.layers.6.mlp.experts.98.up_proj", "model.layers.6.mlp.experts.99.up_proj", "model.layers.6.mlp.experts.100.up_proj", "model.layers.6.mlp.experts.101.up_proj", "model.layers.6.mlp.experts.102.up_proj", "model.layers.6.mlp.experts.103.up_proj", "model.layers.6.mlp.experts.104.up_proj", "model.layers.6.mlp.experts.105.up_proj", "model.layers.6.mlp.experts.106.up_proj", "model.layers.6.mlp.experts.107.up_proj", "model.layers.6.mlp.experts.108.up_proj", "model.layers.6.mlp.experts.109.up_proj", "model.layers.6.mlp.experts.110.up_proj", "model.layers.6.mlp.experts.111.up_proj", "model.layers.6.mlp.experts.112.up_proj", "model.layers.6.mlp.experts.113.up_proj", "model.layers.6.mlp.experts.114.up_proj", "model.layers.6.mlp.experts.115.up_proj", "model.layers.6.mlp.experts.116.up_proj", "model.layers.6.mlp.experts.117.up_proj", "model.layers.6.mlp.experts.118.up_proj", "model.layers.6.mlp.experts.119.up_proj", "model.layers.6.mlp.experts.120.up_proj", "model.layers.6.mlp.experts.121.up_proj", "model.layers.6.mlp.experts.122.up_proj", "model.layers.6.mlp.experts.123.up_proj", "model.layers.6.mlp.experts.124.up_proj", "model.layers.6.mlp.experts.125.up_proj", "model.layers.6.mlp.experts.126.up_proj", "model.layers.6.mlp.experts.127.up_proj", "model.layers.6.mlp.experts.128.up_proj", "model.layers.6.mlp.experts.129.up_proj", "model.layers.6.mlp.experts.130.up_proj", "model.layers.6.mlp.experts.131.up_proj", "model.layers.6.mlp.experts.132.up_proj", "model.layers.6.mlp.experts.133.up_proj", "model.layers.6.mlp.experts.134.up_proj", "model.layers.6.mlp.experts.135.up_proj", "model.layers.6.mlp.experts.136.up_proj", "model.layers.6.mlp.experts.137.up_proj", "model.layers.6.mlp.experts.138.up_proj", "model.layers.6.mlp.experts.139.up_proj", "model.layers.6.mlp.experts.140.up_proj", "model.layers.6.mlp.experts.141.up_proj", "model.layers.6.mlp.experts.142.up_proj", "model.layers.6.mlp.experts.143.up_proj", "model.layers.6.mlp.experts.144.up_proj", "model.layers.6.mlp.experts.145.up_proj", "model.layers.6.mlp.experts.146.up_proj", "model.layers.6.mlp.experts.147.up_proj", "model.layers.6.mlp.experts.148.up_proj", "model.layers.6.mlp.experts.149.up_proj", "model.layers.6.mlp.experts.150.up_proj", "model.layers.6.mlp.experts.151.up_proj", "model.layers.6.mlp.experts.152.up_proj", "model.layers.6.mlp.experts.153.up_proj", "model.layers.6.mlp.experts.154.up_proj", "model.layers.6.mlp.experts.155.up_proj", "model.layers.6.mlp.experts.156.up_proj", "model.layers.6.mlp.experts.157.up_proj", "model.layers.6.mlp.experts.158.up_proj", "model.layers.6.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.471246644854407e-05, "dbits": 2516582400 }, { "dkld": -7.78948655351993e-05, "dbits": 5033164800 } ] }, { "idx": 38, "layers": [ "model.layers.6.mlp.experts.0.down_proj", "model.layers.6.mlp.experts.1.down_proj", "model.layers.6.mlp.experts.2.down_proj", "model.layers.6.mlp.experts.3.down_proj", "model.layers.6.mlp.experts.4.down_proj", "model.layers.6.mlp.experts.5.down_proj", "model.layers.6.mlp.experts.6.down_proj", "model.layers.6.mlp.experts.7.down_proj", "model.layers.6.mlp.experts.8.down_proj", "model.layers.6.mlp.experts.9.down_proj", "model.layers.6.mlp.experts.10.down_proj", "model.layers.6.mlp.experts.11.down_proj", "model.layers.6.mlp.experts.12.down_proj", "model.layers.6.mlp.experts.13.down_proj", "model.layers.6.mlp.experts.14.down_proj", "model.layers.6.mlp.experts.15.down_proj", "model.layers.6.mlp.experts.16.down_proj", "model.layers.6.mlp.experts.17.down_proj", "model.layers.6.mlp.experts.18.down_proj", "model.layers.6.mlp.experts.19.down_proj", "model.layers.6.mlp.experts.20.down_proj", "model.layers.6.mlp.experts.21.down_proj", "model.layers.6.mlp.experts.22.down_proj", "model.layers.6.mlp.experts.23.down_proj", "model.layers.6.mlp.experts.24.down_proj", "model.layers.6.mlp.experts.25.down_proj", "model.layers.6.mlp.experts.26.down_proj", "model.layers.6.mlp.experts.27.down_proj", "model.layers.6.mlp.experts.28.down_proj", "model.layers.6.mlp.experts.29.down_proj", "model.layers.6.mlp.experts.30.down_proj", "model.layers.6.mlp.experts.31.down_proj", "model.layers.6.mlp.experts.32.down_proj", "model.layers.6.mlp.experts.33.down_proj", "model.layers.6.mlp.experts.34.down_proj", "model.layers.6.mlp.experts.35.down_proj", "model.layers.6.mlp.experts.36.down_proj", "model.layers.6.mlp.experts.37.down_proj", "model.layers.6.mlp.experts.38.down_proj", "model.layers.6.mlp.experts.39.down_proj", "model.layers.6.mlp.experts.40.down_proj", "model.layers.6.mlp.experts.41.down_proj", "model.layers.6.mlp.experts.42.down_proj", "model.layers.6.mlp.experts.43.down_proj", "model.layers.6.mlp.experts.44.down_proj", "model.layers.6.mlp.experts.45.down_proj", "model.layers.6.mlp.experts.46.down_proj", "model.layers.6.mlp.experts.47.down_proj", "model.layers.6.mlp.experts.48.down_proj", "model.layers.6.mlp.experts.49.down_proj", "model.layers.6.mlp.experts.50.down_proj", "model.layers.6.mlp.experts.51.down_proj", "model.layers.6.mlp.experts.52.down_proj", "model.layers.6.mlp.experts.53.down_proj", "model.layers.6.mlp.experts.54.down_proj", "model.layers.6.mlp.experts.55.down_proj", "model.layers.6.mlp.experts.56.down_proj", "model.layers.6.mlp.experts.57.down_proj", "model.layers.6.mlp.experts.58.down_proj", "model.layers.6.mlp.experts.59.down_proj", "model.layers.6.mlp.experts.60.down_proj", "model.layers.6.mlp.experts.61.down_proj", "model.layers.6.mlp.experts.62.down_proj", "model.layers.6.mlp.experts.63.down_proj", "model.layers.6.mlp.experts.64.down_proj", "model.layers.6.mlp.experts.65.down_proj", "model.layers.6.mlp.experts.66.down_proj", "model.layers.6.mlp.experts.67.down_proj", "model.layers.6.mlp.experts.68.down_proj", "model.layers.6.mlp.experts.69.down_proj", "model.layers.6.mlp.experts.70.down_proj", "model.layers.6.mlp.experts.71.down_proj", "model.layers.6.mlp.experts.72.down_proj", "model.layers.6.mlp.experts.73.down_proj", "model.layers.6.mlp.experts.74.down_proj", "model.layers.6.mlp.experts.75.down_proj", "model.layers.6.mlp.experts.76.down_proj", "model.layers.6.mlp.experts.77.down_proj", "model.layers.6.mlp.experts.78.down_proj", "model.layers.6.mlp.experts.79.down_proj", "model.layers.6.mlp.experts.80.down_proj", "model.layers.6.mlp.experts.81.down_proj", "model.layers.6.mlp.experts.82.down_proj", "model.layers.6.mlp.experts.83.down_proj", "model.layers.6.mlp.experts.84.down_proj", "model.layers.6.mlp.experts.85.down_proj", "model.layers.6.mlp.experts.86.down_proj", "model.layers.6.mlp.experts.87.down_proj", "model.layers.6.mlp.experts.88.down_proj", "model.layers.6.mlp.experts.89.down_proj", "model.layers.6.mlp.experts.90.down_proj", "model.layers.6.mlp.experts.91.down_proj", "model.layers.6.mlp.experts.92.down_proj", "model.layers.6.mlp.experts.93.down_proj", "model.layers.6.mlp.experts.94.down_proj", "model.layers.6.mlp.experts.95.down_proj", "model.layers.6.mlp.experts.96.down_proj", "model.layers.6.mlp.experts.97.down_proj", "model.layers.6.mlp.experts.98.down_proj", "model.layers.6.mlp.experts.99.down_proj", "model.layers.6.mlp.experts.100.down_proj", "model.layers.6.mlp.experts.101.down_proj", "model.layers.6.mlp.experts.102.down_proj", "model.layers.6.mlp.experts.103.down_proj", "model.layers.6.mlp.experts.104.down_proj", "model.layers.6.mlp.experts.105.down_proj", "model.layers.6.mlp.experts.106.down_proj", "model.layers.6.mlp.experts.107.down_proj", "model.layers.6.mlp.experts.108.down_proj", "model.layers.6.mlp.experts.109.down_proj", "model.layers.6.mlp.experts.110.down_proj", "model.layers.6.mlp.experts.111.down_proj", "model.layers.6.mlp.experts.112.down_proj", "model.layers.6.mlp.experts.113.down_proj", "model.layers.6.mlp.experts.114.down_proj", "model.layers.6.mlp.experts.115.down_proj", "model.layers.6.mlp.experts.116.down_proj", "model.layers.6.mlp.experts.117.down_proj", "model.layers.6.mlp.experts.118.down_proj", "model.layers.6.mlp.experts.119.down_proj", "model.layers.6.mlp.experts.120.down_proj", "model.layers.6.mlp.experts.121.down_proj", "model.layers.6.mlp.experts.122.down_proj", "model.layers.6.mlp.experts.123.down_proj", "model.layers.6.mlp.experts.124.down_proj", "model.layers.6.mlp.experts.125.down_proj", "model.layers.6.mlp.experts.126.down_proj", "model.layers.6.mlp.experts.127.down_proj", "model.layers.6.mlp.experts.128.down_proj", "model.layers.6.mlp.experts.129.down_proj", "model.layers.6.mlp.experts.130.down_proj", "model.layers.6.mlp.experts.131.down_proj", "model.layers.6.mlp.experts.132.down_proj", "model.layers.6.mlp.experts.133.down_proj", "model.layers.6.mlp.experts.134.down_proj", "model.layers.6.mlp.experts.135.down_proj", "model.layers.6.mlp.experts.136.down_proj", "model.layers.6.mlp.experts.137.down_proj", "model.layers.6.mlp.experts.138.down_proj", "model.layers.6.mlp.experts.139.down_proj", "model.layers.6.mlp.experts.140.down_proj", "model.layers.6.mlp.experts.141.down_proj", "model.layers.6.mlp.experts.142.down_proj", "model.layers.6.mlp.experts.143.down_proj", "model.layers.6.mlp.experts.144.down_proj", "model.layers.6.mlp.experts.145.down_proj", "model.layers.6.mlp.experts.146.down_proj", "model.layers.6.mlp.experts.147.down_proj", "model.layers.6.mlp.experts.148.down_proj", "model.layers.6.mlp.experts.149.down_proj", "model.layers.6.mlp.experts.150.down_proj", "model.layers.6.mlp.experts.151.down_proj", "model.layers.6.mlp.experts.152.down_proj", "model.layers.6.mlp.experts.153.down_proj", "model.layers.6.mlp.experts.154.down_proj", "model.layers.6.mlp.experts.155.down_proj", "model.layers.6.mlp.experts.156.down_proj", "model.layers.6.mlp.experts.157.down_proj", "model.layers.6.mlp.experts.158.down_proj", "model.layers.6.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.9968203529714844e-05, "dbits": 1258291200 }, { "dkld": -2.8745643794535203e-05, "dbits": 2516582400 } ] }, { "idx": 39, "layers": [ "model.layers.7.self_attn.q_proj" ], "candidates": [ { "dkld": -3.7848437204956314e-05, "dbits": 62914560 }, { "dkld": -3.71114350855347e-05, "dbits": 125829120 } ] }, { "idx": 40, "layers": [ "model.layers.7.self_attn.k_proj", "model.layers.7.self_attn.v_proj" ], "candidates": [ { "dkld": 9.451992809772491e-06, "dbits": 10485760 }, { "dkld": -2.0727934315799973e-05, "dbits": 20971520 } ] }, { "idx": 41, "layers": [ "model.layers.7.self_attn.o_proj" ], "candidates": [ { "dkld": -6.601614877581492e-05, "dbits": 62914560 }, { "dkld": -6.86295796185725e-05, "dbits": 125829120 } ] }, { "idx": 42, "layers": [ "model.layers.7.mlp.shared_experts.gate_proj", "model.layers.7.mlp.shared_experts.up_proj", "model.layers.7.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.018300049006939e-06, "dbits": 23592960 }, { "dkld": -2.1181069314479828e-05, "dbits": 47185920 } ] }, { "idx": 43, "layers": [ "model.layers.7.mlp.experts.0.gate_proj", "model.layers.7.mlp.experts.1.gate_proj", "model.layers.7.mlp.experts.2.gate_proj", "model.layers.7.mlp.experts.3.gate_proj", "model.layers.7.mlp.experts.4.gate_proj", "model.layers.7.mlp.experts.5.gate_proj", "model.layers.7.mlp.experts.6.gate_proj", "model.layers.7.mlp.experts.7.gate_proj", "model.layers.7.mlp.experts.8.gate_proj", "model.layers.7.mlp.experts.9.gate_proj", "model.layers.7.mlp.experts.10.gate_proj", "model.layers.7.mlp.experts.11.gate_proj", "model.layers.7.mlp.experts.12.gate_proj", "model.layers.7.mlp.experts.13.gate_proj", "model.layers.7.mlp.experts.14.gate_proj", "model.layers.7.mlp.experts.15.gate_proj", "model.layers.7.mlp.experts.16.gate_proj", "model.layers.7.mlp.experts.17.gate_proj", "model.layers.7.mlp.experts.18.gate_proj", "model.layers.7.mlp.experts.19.gate_proj", "model.layers.7.mlp.experts.20.gate_proj", "model.layers.7.mlp.experts.21.gate_proj", "model.layers.7.mlp.experts.22.gate_proj", "model.layers.7.mlp.experts.23.gate_proj", "model.layers.7.mlp.experts.24.gate_proj", "model.layers.7.mlp.experts.25.gate_proj", "model.layers.7.mlp.experts.26.gate_proj", "model.layers.7.mlp.experts.27.gate_proj", "model.layers.7.mlp.experts.28.gate_proj", "model.layers.7.mlp.experts.29.gate_proj", "model.layers.7.mlp.experts.30.gate_proj", "model.layers.7.mlp.experts.31.gate_proj", "model.layers.7.mlp.experts.32.gate_proj", "model.layers.7.mlp.experts.33.gate_proj", "model.layers.7.mlp.experts.34.gate_proj", "model.layers.7.mlp.experts.35.gate_proj", "model.layers.7.mlp.experts.36.gate_proj", "model.layers.7.mlp.experts.37.gate_proj", "model.layers.7.mlp.experts.38.gate_proj", "model.layers.7.mlp.experts.39.gate_proj", "model.layers.7.mlp.experts.40.gate_proj", "model.layers.7.mlp.experts.41.gate_proj", "model.layers.7.mlp.experts.42.gate_proj", "model.layers.7.mlp.experts.43.gate_proj", "model.layers.7.mlp.experts.44.gate_proj", "model.layers.7.mlp.experts.45.gate_proj", "model.layers.7.mlp.experts.46.gate_proj", "model.layers.7.mlp.experts.47.gate_proj", "model.layers.7.mlp.experts.48.gate_proj", "model.layers.7.mlp.experts.49.gate_proj", "model.layers.7.mlp.experts.50.gate_proj", "model.layers.7.mlp.experts.51.gate_proj", "model.layers.7.mlp.experts.52.gate_proj", "model.layers.7.mlp.experts.53.gate_proj", "model.layers.7.mlp.experts.54.gate_proj", "model.layers.7.mlp.experts.55.gate_proj", "model.layers.7.mlp.experts.56.gate_proj", "model.layers.7.mlp.experts.57.gate_proj", "model.layers.7.mlp.experts.58.gate_proj", "model.layers.7.mlp.experts.59.gate_proj", "model.layers.7.mlp.experts.60.gate_proj", "model.layers.7.mlp.experts.61.gate_proj", "model.layers.7.mlp.experts.62.gate_proj", "model.layers.7.mlp.experts.63.gate_proj", "model.layers.7.mlp.experts.64.gate_proj", "model.layers.7.mlp.experts.65.gate_proj", "model.layers.7.mlp.experts.66.gate_proj", "model.layers.7.mlp.experts.67.gate_proj", "model.layers.7.mlp.experts.68.gate_proj", "model.layers.7.mlp.experts.69.gate_proj", "model.layers.7.mlp.experts.70.gate_proj", "model.layers.7.mlp.experts.71.gate_proj", "model.layers.7.mlp.experts.72.gate_proj", "model.layers.7.mlp.experts.73.gate_proj", "model.layers.7.mlp.experts.74.gate_proj", "model.layers.7.mlp.experts.75.gate_proj", "model.layers.7.mlp.experts.76.gate_proj", "model.layers.7.mlp.experts.77.gate_proj", "model.layers.7.mlp.experts.78.gate_proj", "model.layers.7.mlp.experts.79.gate_proj", "model.layers.7.mlp.experts.80.gate_proj", "model.layers.7.mlp.experts.81.gate_proj", "model.layers.7.mlp.experts.82.gate_proj", "model.layers.7.mlp.experts.83.gate_proj", "model.layers.7.mlp.experts.84.gate_proj", "model.layers.7.mlp.experts.85.gate_proj", "model.layers.7.mlp.experts.86.gate_proj", "model.layers.7.mlp.experts.87.gate_proj", "model.layers.7.mlp.experts.88.gate_proj", "model.layers.7.mlp.experts.89.gate_proj", "model.layers.7.mlp.experts.90.gate_proj", "model.layers.7.mlp.experts.91.gate_proj", "model.layers.7.mlp.experts.92.gate_proj", "model.layers.7.mlp.experts.93.gate_proj", "model.layers.7.mlp.experts.94.gate_proj", "model.layers.7.mlp.experts.95.gate_proj", "model.layers.7.mlp.experts.96.gate_proj", "model.layers.7.mlp.experts.97.gate_proj", "model.layers.7.mlp.experts.98.gate_proj", "model.layers.7.mlp.experts.99.gate_proj", "model.layers.7.mlp.experts.100.gate_proj", "model.layers.7.mlp.experts.101.gate_proj", "model.layers.7.mlp.experts.102.gate_proj", "model.layers.7.mlp.experts.103.gate_proj", "model.layers.7.mlp.experts.104.gate_proj", "model.layers.7.mlp.experts.105.gate_proj", "model.layers.7.mlp.experts.106.gate_proj", "model.layers.7.mlp.experts.107.gate_proj", "model.layers.7.mlp.experts.108.gate_proj", "model.layers.7.mlp.experts.109.gate_proj", "model.layers.7.mlp.experts.110.gate_proj", "model.layers.7.mlp.experts.111.gate_proj", "model.layers.7.mlp.experts.112.gate_proj", "model.layers.7.mlp.experts.113.gate_proj", "model.layers.7.mlp.experts.114.gate_proj", "model.layers.7.mlp.experts.115.gate_proj", "model.layers.7.mlp.experts.116.gate_proj", "model.layers.7.mlp.experts.117.gate_proj", "model.layers.7.mlp.experts.118.gate_proj", "model.layers.7.mlp.experts.119.gate_proj", "model.layers.7.mlp.experts.120.gate_proj", "model.layers.7.mlp.experts.121.gate_proj", "model.layers.7.mlp.experts.122.gate_proj", "model.layers.7.mlp.experts.123.gate_proj", "model.layers.7.mlp.experts.124.gate_proj", "model.layers.7.mlp.experts.125.gate_proj", "model.layers.7.mlp.experts.126.gate_proj", "model.layers.7.mlp.experts.127.gate_proj", "model.layers.7.mlp.experts.128.gate_proj", "model.layers.7.mlp.experts.129.gate_proj", "model.layers.7.mlp.experts.130.gate_proj", "model.layers.7.mlp.experts.131.gate_proj", "model.layers.7.mlp.experts.132.gate_proj", "model.layers.7.mlp.experts.133.gate_proj", "model.layers.7.mlp.experts.134.gate_proj", "model.layers.7.mlp.experts.135.gate_proj", "model.layers.7.mlp.experts.136.gate_proj", "model.layers.7.mlp.experts.137.gate_proj", "model.layers.7.mlp.experts.138.gate_proj", "model.layers.7.mlp.experts.139.gate_proj", "model.layers.7.mlp.experts.140.gate_proj", "model.layers.7.mlp.experts.141.gate_proj", "model.layers.7.mlp.experts.142.gate_proj", "model.layers.7.mlp.experts.143.gate_proj", "model.layers.7.mlp.experts.144.gate_proj", "model.layers.7.mlp.experts.145.gate_proj", "model.layers.7.mlp.experts.146.gate_proj", "model.layers.7.mlp.experts.147.gate_proj", "model.layers.7.mlp.experts.148.gate_proj", "model.layers.7.mlp.experts.149.gate_proj", "model.layers.7.mlp.experts.150.gate_proj", "model.layers.7.mlp.experts.151.gate_proj", "model.layers.7.mlp.experts.152.gate_proj", "model.layers.7.mlp.experts.153.gate_proj", "model.layers.7.mlp.experts.154.gate_proj", "model.layers.7.mlp.experts.155.gate_proj", "model.layers.7.mlp.experts.156.gate_proj", "model.layers.7.mlp.experts.157.gate_proj", "model.layers.7.mlp.experts.158.gate_proj", "model.layers.7.mlp.experts.159.gate_proj", "model.layers.7.mlp.experts.0.up_proj", "model.layers.7.mlp.experts.1.up_proj", "model.layers.7.mlp.experts.2.up_proj", "model.layers.7.mlp.experts.3.up_proj", "model.layers.7.mlp.experts.4.up_proj", "model.layers.7.mlp.experts.5.up_proj", "model.layers.7.mlp.experts.6.up_proj", "model.layers.7.mlp.experts.7.up_proj", "model.layers.7.mlp.experts.8.up_proj", "model.layers.7.mlp.experts.9.up_proj", "model.layers.7.mlp.experts.10.up_proj", "model.layers.7.mlp.experts.11.up_proj", "model.layers.7.mlp.experts.12.up_proj", "model.layers.7.mlp.experts.13.up_proj", "model.layers.7.mlp.experts.14.up_proj", "model.layers.7.mlp.experts.15.up_proj", "model.layers.7.mlp.experts.16.up_proj", "model.layers.7.mlp.experts.17.up_proj", "model.layers.7.mlp.experts.18.up_proj", "model.layers.7.mlp.experts.19.up_proj", "model.layers.7.mlp.experts.20.up_proj", "model.layers.7.mlp.experts.21.up_proj", "model.layers.7.mlp.experts.22.up_proj", "model.layers.7.mlp.experts.23.up_proj", "model.layers.7.mlp.experts.24.up_proj", "model.layers.7.mlp.experts.25.up_proj", "model.layers.7.mlp.experts.26.up_proj", "model.layers.7.mlp.experts.27.up_proj", "model.layers.7.mlp.experts.28.up_proj", "model.layers.7.mlp.experts.29.up_proj", "model.layers.7.mlp.experts.30.up_proj", "model.layers.7.mlp.experts.31.up_proj", "model.layers.7.mlp.experts.32.up_proj", "model.layers.7.mlp.experts.33.up_proj", "model.layers.7.mlp.experts.34.up_proj", "model.layers.7.mlp.experts.35.up_proj", "model.layers.7.mlp.experts.36.up_proj", "model.layers.7.mlp.experts.37.up_proj", "model.layers.7.mlp.experts.38.up_proj", "model.layers.7.mlp.experts.39.up_proj", "model.layers.7.mlp.experts.40.up_proj", "model.layers.7.mlp.experts.41.up_proj", "model.layers.7.mlp.experts.42.up_proj", "model.layers.7.mlp.experts.43.up_proj", "model.layers.7.mlp.experts.44.up_proj", "model.layers.7.mlp.experts.45.up_proj", "model.layers.7.mlp.experts.46.up_proj", "model.layers.7.mlp.experts.47.up_proj", "model.layers.7.mlp.experts.48.up_proj", "model.layers.7.mlp.experts.49.up_proj", "model.layers.7.mlp.experts.50.up_proj", "model.layers.7.mlp.experts.51.up_proj", "model.layers.7.mlp.experts.52.up_proj", "model.layers.7.mlp.experts.53.up_proj", "model.layers.7.mlp.experts.54.up_proj", "model.layers.7.mlp.experts.55.up_proj", "model.layers.7.mlp.experts.56.up_proj", "model.layers.7.mlp.experts.57.up_proj", "model.layers.7.mlp.experts.58.up_proj", "model.layers.7.mlp.experts.59.up_proj", "model.layers.7.mlp.experts.60.up_proj", "model.layers.7.mlp.experts.61.up_proj", "model.layers.7.mlp.experts.62.up_proj", "model.layers.7.mlp.experts.63.up_proj", "model.layers.7.mlp.experts.64.up_proj", "model.layers.7.mlp.experts.65.up_proj", "model.layers.7.mlp.experts.66.up_proj", "model.layers.7.mlp.experts.67.up_proj", "model.layers.7.mlp.experts.68.up_proj", "model.layers.7.mlp.experts.69.up_proj", "model.layers.7.mlp.experts.70.up_proj", "model.layers.7.mlp.experts.71.up_proj", "model.layers.7.mlp.experts.72.up_proj", "model.layers.7.mlp.experts.73.up_proj", "model.layers.7.mlp.experts.74.up_proj", "model.layers.7.mlp.experts.75.up_proj", "model.layers.7.mlp.experts.76.up_proj", "model.layers.7.mlp.experts.77.up_proj", "model.layers.7.mlp.experts.78.up_proj", "model.layers.7.mlp.experts.79.up_proj", "model.layers.7.mlp.experts.80.up_proj", "model.layers.7.mlp.experts.81.up_proj", "model.layers.7.mlp.experts.82.up_proj", "model.layers.7.mlp.experts.83.up_proj", "model.layers.7.mlp.experts.84.up_proj", "model.layers.7.mlp.experts.85.up_proj", "model.layers.7.mlp.experts.86.up_proj", "model.layers.7.mlp.experts.87.up_proj", "model.layers.7.mlp.experts.88.up_proj", "model.layers.7.mlp.experts.89.up_proj", "model.layers.7.mlp.experts.90.up_proj", "model.layers.7.mlp.experts.91.up_proj", "model.layers.7.mlp.experts.92.up_proj", "model.layers.7.mlp.experts.93.up_proj", "model.layers.7.mlp.experts.94.up_proj", "model.layers.7.mlp.experts.95.up_proj", "model.layers.7.mlp.experts.96.up_proj", "model.layers.7.mlp.experts.97.up_proj", "model.layers.7.mlp.experts.98.up_proj", "model.layers.7.mlp.experts.99.up_proj", "model.layers.7.mlp.experts.100.up_proj", "model.layers.7.mlp.experts.101.up_proj", "model.layers.7.mlp.experts.102.up_proj", "model.layers.7.mlp.experts.103.up_proj", "model.layers.7.mlp.experts.104.up_proj", "model.layers.7.mlp.experts.105.up_proj", "model.layers.7.mlp.experts.106.up_proj", "model.layers.7.mlp.experts.107.up_proj", "model.layers.7.mlp.experts.108.up_proj", "model.layers.7.mlp.experts.109.up_proj", "model.layers.7.mlp.experts.110.up_proj", "model.layers.7.mlp.experts.111.up_proj", "model.layers.7.mlp.experts.112.up_proj", "model.layers.7.mlp.experts.113.up_proj", "model.layers.7.mlp.experts.114.up_proj", "model.layers.7.mlp.experts.115.up_proj", "model.layers.7.mlp.experts.116.up_proj", "model.layers.7.mlp.experts.117.up_proj", "model.layers.7.mlp.experts.118.up_proj", "model.layers.7.mlp.experts.119.up_proj", "model.layers.7.mlp.experts.120.up_proj", "model.layers.7.mlp.experts.121.up_proj", "model.layers.7.mlp.experts.122.up_proj", "model.layers.7.mlp.experts.123.up_proj", "model.layers.7.mlp.experts.124.up_proj", "model.layers.7.mlp.experts.125.up_proj", "model.layers.7.mlp.experts.126.up_proj", "model.layers.7.mlp.experts.127.up_proj", "model.layers.7.mlp.experts.128.up_proj", "model.layers.7.mlp.experts.129.up_proj", "model.layers.7.mlp.experts.130.up_proj", "model.layers.7.mlp.experts.131.up_proj", "model.layers.7.mlp.experts.132.up_proj", "model.layers.7.mlp.experts.133.up_proj", "model.layers.7.mlp.experts.134.up_proj", "model.layers.7.mlp.experts.135.up_proj", "model.layers.7.mlp.experts.136.up_proj", "model.layers.7.mlp.experts.137.up_proj", "model.layers.7.mlp.experts.138.up_proj", "model.layers.7.mlp.experts.139.up_proj", "model.layers.7.mlp.experts.140.up_proj", "model.layers.7.mlp.experts.141.up_proj", "model.layers.7.mlp.experts.142.up_proj", "model.layers.7.mlp.experts.143.up_proj", "model.layers.7.mlp.experts.144.up_proj", "model.layers.7.mlp.experts.145.up_proj", "model.layers.7.mlp.experts.146.up_proj", "model.layers.7.mlp.experts.147.up_proj", "model.layers.7.mlp.experts.148.up_proj", "model.layers.7.mlp.experts.149.up_proj", "model.layers.7.mlp.experts.150.up_proj", "model.layers.7.mlp.experts.151.up_proj", "model.layers.7.mlp.experts.152.up_proj", "model.layers.7.mlp.experts.153.up_proj", "model.layers.7.mlp.experts.154.up_proj", "model.layers.7.mlp.experts.155.up_proj", "model.layers.7.mlp.experts.156.up_proj", "model.layers.7.mlp.experts.157.up_proj", "model.layers.7.mlp.experts.158.up_proj", "model.layers.7.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.5651714056728883e-05, "dbits": 2516582400 }, { "dkld": -3.2809912227094173e-05, "dbits": 5033164800 } ] }, { "idx": 44, "layers": [ "model.layers.7.mlp.experts.0.down_proj", "model.layers.7.mlp.experts.1.down_proj", "model.layers.7.mlp.experts.2.down_proj", "model.layers.7.mlp.experts.3.down_proj", "model.layers.7.mlp.experts.4.down_proj", "model.layers.7.mlp.experts.5.down_proj", "model.layers.7.mlp.experts.6.down_proj", "model.layers.7.mlp.experts.7.down_proj", "model.layers.7.mlp.experts.8.down_proj", "model.layers.7.mlp.experts.9.down_proj", "model.layers.7.mlp.experts.10.down_proj", "model.layers.7.mlp.experts.11.down_proj", "model.layers.7.mlp.experts.12.down_proj", "model.layers.7.mlp.experts.13.down_proj", "model.layers.7.mlp.experts.14.down_proj", "model.layers.7.mlp.experts.15.down_proj", "model.layers.7.mlp.experts.16.down_proj", "model.layers.7.mlp.experts.17.down_proj", "model.layers.7.mlp.experts.18.down_proj", "model.layers.7.mlp.experts.19.down_proj", "model.layers.7.mlp.experts.20.down_proj", "model.layers.7.mlp.experts.21.down_proj", "model.layers.7.mlp.experts.22.down_proj", "model.layers.7.mlp.experts.23.down_proj", "model.layers.7.mlp.experts.24.down_proj", "model.layers.7.mlp.experts.25.down_proj", "model.layers.7.mlp.experts.26.down_proj", "model.layers.7.mlp.experts.27.down_proj", "model.layers.7.mlp.experts.28.down_proj", "model.layers.7.mlp.experts.29.down_proj", "model.layers.7.mlp.experts.30.down_proj", "model.layers.7.mlp.experts.31.down_proj", "model.layers.7.mlp.experts.32.down_proj", "model.layers.7.mlp.experts.33.down_proj", "model.layers.7.mlp.experts.34.down_proj", "model.layers.7.mlp.experts.35.down_proj", "model.layers.7.mlp.experts.36.down_proj", "model.layers.7.mlp.experts.37.down_proj", "model.layers.7.mlp.experts.38.down_proj", "model.layers.7.mlp.experts.39.down_proj", "model.layers.7.mlp.experts.40.down_proj", "model.layers.7.mlp.experts.41.down_proj", "model.layers.7.mlp.experts.42.down_proj", "model.layers.7.mlp.experts.43.down_proj", "model.layers.7.mlp.experts.44.down_proj", "model.layers.7.mlp.experts.45.down_proj", "model.layers.7.mlp.experts.46.down_proj", "model.layers.7.mlp.experts.47.down_proj", "model.layers.7.mlp.experts.48.down_proj", "model.layers.7.mlp.experts.49.down_proj", "model.layers.7.mlp.experts.50.down_proj", "model.layers.7.mlp.experts.51.down_proj", "model.layers.7.mlp.experts.52.down_proj", "model.layers.7.mlp.experts.53.down_proj", "model.layers.7.mlp.experts.54.down_proj", "model.layers.7.mlp.experts.55.down_proj", "model.layers.7.mlp.experts.56.down_proj", "model.layers.7.mlp.experts.57.down_proj", "model.layers.7.mlp.experts.58.down_proj", "model.layers.7.mlp.experts.59.down_proj", "model.layers.7.mlp.experts.60.down_proj", "model.layers.7.mlp.experts.61.down_proj", "model.layers.7.mlp.experts.62.down_proj", "model.layers.7.mlp.experts.63.down_proj", "model.layers.7.mlp.experts.64.down_proj", "model.layers.7.mlp.experts.65.down_proj", "model.layers.7.mlp.experts.66.down_proj", "model.layers.7.mlp.experts.67.down_proj", "model.layers.7.mlp.experts.68.down_proj", "model.layers.7.mlp.experts.69.down_proj", "model.layers.7.mlp.experts.70.down_proj", "model.layers.7.mlp.experts.71.down_proj", "model.layers.7.mlp.experts.72.down_proj", "model.layers.7.mlp.experts.73.down_proj", "model.layers.7.mlp.experts.74.down_proj", "model.layers.7.mlp.experts.75.down_proj", "model.layers.7.mlp.experts.76.down_proj", "model.layers.7.mlp.experts.77.down_proj", "model.layers.7.mlp.experts.78.down_proj", "model.layers.7.mlp.experts.79.down_proj", "model.layers.7.mlp.experts.80.down_proj", "model.layers.7.mlp.experts.81.down_proj", "model.layers.7.mlp.experts.82.down_proj", "model.layers.7.mlp.experts.83.down_proj", "model.layers.7.mlp.experts.84.down_proj", "model.layers.7.mlp.experts.85.down_proj", "model.layers.7.mlp.experts.86.down_proj", "model.layers.7.mlp.experts.87.down_proj", "model.layers.7.mlp.experts.88.down_proj", "model.layers.7.mlp.experts.89.down_proj", "model.layers.7.mlp.experts.90.down_proj", "model.layers.7.mlp.experts.91.down_proj", "model.layers.7.mlp.experts.92.down_proj", "model.layers.7.mlp.experts.93.down_proj", "model.layers.7.mlp.experts.94.down_proj", "model.layers.7.mlp.experts.95.down_proj", "model.layers.7.mlp.experts.96.down_proj", "model.layers.7.mlp.experts.97.down_proj", "model.layers.7.mlp.experts.98.down_proj", "model.layers.7.mlp.experts.99.down_proj", "model.layers.7.mlp.experts.100.down_proj", "model.layers.7.mlp.experts.101.down_proj", "model.layers.7.mlp.experts.102.down_proj", "model.layers.7.mlp.experts.103.down_proj", "model.layers.7.mlp.experts.104.down_proj", "model.layers.7.mlp.experts.105.down_proj", "model.layers.7.mlp.experts.106.down_proj", "model.layers.7.mlp.experts.107.down_proj", "model.layers.7.mlp.experts.108.down_proj", "model.layers.7.mlp.experts.109.down_proj", "model.layers.7.mlp.experts.110.down_proj", "model.layers.7.mlp.experts.111.down_proj", "model.layers.7.mlp.experts.112.down_proj", "model.layers.7.mlp.experts.113.down_proj", "model.layers.7.mlp.experts.114.down_proj", "model.layers.7.mlp.experts.115.down_proj", "model.layers.7.mlp.experts.116.down_proj", "model.layers.7.mlp.experts.117.down_proj", "model.layers.7.mlp.experts.118.down_proj", "model.layers.7.mlp.experts.119.down_proj", "model.layers.7.mlp.experts.120.down_proj", "model.layers.7.mlp.experts.121.down_proj", "model.layers.7.mlp.experts.122.down_proj", "model.layers.7.mlp.experts.123.down_proj", "model.layers.7.mlp.experts.124.down_proj", "model.layers.7.mlp.experts.125.down_proj", "model.layers.7.mlp.experts.126.down_proj", "model.layers.7.mlp.experts.127.down_proj", "model.layers.7.mlp.experts.128.down_proj", "model.layers.7.mlp.experts.129.down_proj", "model.layers.7.mlp.experts.130.down_proj", "model.layers.7.mlp.experts.131.down_proj", "model.layers.7.mlp.experts.132.down_proj", "model.layers.7.mlp.experts.133.down_proj", "model.layers.7.mlp.experts.134.down_proj", "model.layers.7.mlp.experts.135.down_proj", "model.layers.7.mlp.experts.136.down_proj", "model.layers.7.mlp.experts.137.down_proj", "model.layers.7.mlp.experts.138.down_proj", "model.layers.7.mlp.experts.139.down_proj", "model.layers.7.mlp.experts.140.down_proj", "model.layers.7.mlp.experts.141.down_proj", "model.layers.7.mlp.experts.142.down_proj", "model.layers.7.mlp.experts.143.down_proj", "model.layers.7.mlp.experts.144.down_proj", "model.layers.7.mlp.experts.145.down_proj", "model.layers.7.mlp.experts.146.down_proj", "model.layers.7.mlp.experts.147.down_proj", "model.layers.7.mlp.experts.148.down_proj", "model.layers.7.mlp.experts.149.down_proj", "model.layers.7.mlp.experts.150.down_proj", "model.layers.7.mlp.experts.151.down_proj", "model.layers.7.mlp.experts.152.down_proj", "model.layers.7.mlp.experts.153.down_proj", "model.layers.7.mlp.experts.154.down_proj", "model.layers.7.mlp.experts.155.down_proj", "model.layers.7.mlp.experts.156.down_proj", "model.layers.7.mlp.experts.157.down_proj", "model.layers.7.mlp.experts.158.down_proj", "model.layers.7.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.64774964004755e-05, "dbits": 1258291200 }, { "dkld": -3.701751120388508e-05, "dbits": 2516582400 } ] }, { "idx": 45, "layers": [ "model.layers.8.self_attn.q_proj" ], "candidates": [ { "dkld": -5.074590444564819e-05, "dbits": 62914560 }, { "dkld": -2.3273169063031673e-05, "dbits": 125829120 } ] }, { "idx": 46, "layers": [ "model.layers.8.self_attn.k_proj", "model.layers.8.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00010372237302362815, "dbits": 10485760 }, { "dkld": -0.00017430428415536776, "dbits": 20971520 } ] }, { "idx": 47, "layers": [ "model.layers.8.self_attn.o_proj" ], "candidates": [ { "dkld": 6.555453874170815e-05, "dbits": 62914560 }, { "dkld": 3.359396941959858e-05, "dbits": 125829120 } ] }, { "idx": 48, "layers": [ "model.layers.8.mlp.shared_experts.gate_proj", "model.layers.8.mlp.shared_experts.up_proj", "model.layers.8.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00011860118247568503, "dbits": 23592960 }, { "dkld": -8.746017701923708e-05, "dbits": 47185920 } ] }, { "idx": 49, "layers": [ "model.layers.8.mlp.experts.0.gate_proj", "model.layers.8.mlp.experts.1.gate_proj", "model.layers.8.mlp.experts.2.gate_proj", "model.layers.8.mlp.experts.3.gate_proj", "model.layers.8.mlp.experts.4.gate_proj", "model.layers.8.mlp.experts.5.gate_proj", "model.layers.8.mlp.experts.6.gate_proj", "model.layers.8.mlp.experts.7.gate_proj", "model.layers.8.mlp.experts.8.gate_proj", "model.layers.8.mlp.experts.9.gate_proj", "model.layers.8.mlp.experts.10.gate_proj", "model.layers.8.mlp.experts.11.gate_proj", "model.layers.8.mlp.experts.12.gate_proj", "model.layers.8.mlp.experts.13.gate_proj", "model.layers.8.mlp.experts.14.gate_proj", "model.layers.8.mlp.experts.15.gate_proj", "model.layers.8.mlp.experts.16.gate_proj", "model.layers.8.mlp.experts.17.gate_proj", "model.layers.8.mlp.experts.18.gate_proj", "model.layers.8.mlp.experts.19.gate_proj", "model.layers.8.mlp.experts.20.gate_proj", "model.layers.8.mlp.experts.21.gate_proj", "model.layers.8.mlp.experts.22.gate_proj", "model.layers.8.mlp.experts.23.gate_proj", "model.layers.8.mlp.experts.24.gate_proj", "model.layers.8.mlp.experts.25.gate_proj", "model.layers.8.mlp.experts.26.gate_proj", "model.layers.8.mlp.experts.27.gate_proj", "model.layers.8.mlp.experts.28.gate_proj", "model.layers.8.mlp.experts.29.gate_proj", "model.layers.8.mlp.experts.30.gate_proj", "model.layers.8.mlp.experts.31.gate_proj", "model.layers.8.mlp.experts.32.gate_proj", "model.layers.8.mlp.experts.33.gate_proj", "model.layers.8.mlp.experts.34.gate_proj", "model.layers.8.mlp.experts.35.gate_proj", "model.layers.8.mlp.experts.36.gate_proj", "model.layers.8.mlp.experts.37.gate_proj", "model.layers.8.mlp.experts.38.gate_proj", "model.layers.8.mlp.experts.39.gate_proj", "model.layers.8.mlp.experts.40.gate_proj", "model.layers.8.mlp.experts.41.gate_proj", "model.layers.8.mlp.experts.42.gate_proj", "model.layers.8.mlp.experts.43.gate_proj", "model.layers.8.mlp.experts.44.gate_proj", "model.layers.8.mlp.experts.45.gate_proj", "model.layers.8.mlp.experts.46.gate_proj", "model.layers.8.mlp.experts.47.gate_proj", "model.layers.8.mlp.experts.48.gate_proj", "model.layers.8.mlp.experts.49.gate_proj", "model.layers.8.mlp.experts.50.gate_proj", "model.layers.8.mlp.experts.51.gate_proj", "model.layers.8.mlp.experts.52.gate_proj", "model.layers.8.mlp.experts.53.gate_proj", "model.layers.8.mlp.experts.54.gate_proj", "model.layers.8.mlp.experts.55.gate_proj", "model.layers.8.mlp.experts.56.gate_proj", "model.layers.8.mlp.experts.57.gate_proj", "model.layers.8.mlp.experts.58.gate_proj", "model.layers.8.mlp.experts.59.gate_proj", "model.layers.8.mlp.experts.60.gate_proj", "model.layers.8.mlp.experts.61.gate_proj", "model.layers.8.mlp.experts.62.gate_proj", "model.layers.8.mlp.experts.63.gate_proj", "model.layers.8.mlp.experts.64.gate_proj", "model.layers.8.mlp.experts.65.gate_proj", "model.layers.8.mlp.experts.66.gate_proj", "model.layers.8.mlp.experts.67.gate_proj", "model.layers.8.mlp.experts.68.gate_proj", "model.layers.8.mlp.experts.69.gate_proj", "model.layers.8.mlp.experts.70.gate_proj", "model.layers.8.mlp.experts.71.gate_proj", "model.layers.8.mlp.experts.72.gate_proj", "model.layers.8.mlp.experts.73.gate_proj", "model.layers.8.mlp.experts.74.gate_proj", "model.layers.8.mlp.experts.75.gate_proj", "model.layers.8.mlp.experts.76.gate_proj", "model.layers.8.mlp.experts.77.gate_proj", "model.layers.8.mlp.experts.78.gate_proj", "model.layers.8.mlp.experts.79.gate_proj", "model.layers.8.mlp.experts.80.gate_proj", "model.layers.8.mlp.experts.81.gate_proj", "model.layers.8.mlp.experts.82.gate_proj", "model.layers.8.mlp.experts.83.gate_proj", "model.layers.8.mlp.experts.84.gate_proj", "model.layers.8.mlp.experts.85.gate_proj", "model.layers.8.mlp.experts.86.gate_proj", "model.layers.8.mlp.experts.87.gate_proj", "model.layers.8.mlp.experts.88.gate_proj", "model.layers.8.mlp.experts.89.gate_proj", "model.layers.8.mlp.experts.90.gate_proj", "model.layers.8.mlp.experts.91.gate_proj", "model.layers.8.mlp.experts.92.gate_proj", "model.layers.8.mlp.experts.93.gate_proj", "model.layers.8.mlp.experts.94.gate_proj", "model.layers.8.mlp.experts.95.gate_proj", "model.layers.8.mlp.experts.96.gate_proj", "model.layers.8.mlp.experts.97.gate_proj", "model.layers.8.mlp.experts.98.gate_proj", "model.layers.8.mlp.experts.99.gate_proj", "model.layers.8.mlp.experts.100.gate_proj", "model.layers.8.mlp.experts.101.gate_proj", "model.layers.8.mlp.experts.102.gate_proj", "model.layers.8.mlp.experts.103.gate_proj", "model.layers.8.mlp.experts.104.gate_proj", "model.layers.8.mlp.experts.105.gate_proj", "model.layers.8.mlp.experts.106.gate_proj", "model.layers.8.mlp.experts.107.gate_proj", "model.layers.8.mlp.experts.108.gate_proj", "model.layers.8.mlp.experts.109.gate_proj", "model.layers.8.mlp.experts.110.gate_proj", "model.layers.8.mlp.experts.111.gate_proj", "model.layers.8.mlp.experts.112.gate_proj", "model.layers.8.mlp.experts.113.gate_proj", "model.layers.8.mlp.experts.114.gate_proj", "model.layers.8.mlp.experts.115.gate_proj", "model.layers.8.mlp.experts.116.gate_proj", "model.layers.8.mlp.experts.117.gate_proj", "model.layers.8.mlp.experts.118.gate_proj", "model.layers.8.mlp.experts.119.gate_proj", "model.layers.8.mlp.experts.120.gate_proj", "model.layers.8.mlp.experts.121.gate_proj", "model.layers.8.mlp.experts.122.gate_proj", "model.layers.8.mlp.experts.123.gate_proj", "model.layers.8.mlp.experts.124.gate_proj", "model.layers.8.mlp.experts.125.gate_proj", "model.layers.8.mlp.experts.126.gate_proj", "model.layers.8.mlp.experts.127.gate_proj", "model.layers.8.mlp.experts.128.gate_proj", "model.layers.8.mlp.experts.129.gate_proj", "model.layers.8.mlp.experts.130.gate_proj", "model.layers.8.mlp.experts.131.gate_proj", "model.layers.8.mlp.experts.132.gate_proj", "model.layers.8.mlp.experts.133.gate_proj", "model.layers.8.mlp.experts.134.gate_proj", "model.layers.8.mlp.experts.135.gate_proj", "model.layers.8.mlp.experts.136.gate_proj", "model.layers.8.mlp.experts.137.gate_proj", "model.layers.8.mlp.experts.138.gate_proj", "model.layers.8.mlp.experts.139.gate_proj", "model.layers.8.mlp.experts.140.gate_proj", "model.layers.8.mlp.experts.141.gate_proj", "model.layers.8.mlp.experts.142.gate_proj", "model.layers.8.mlp.experts.143.gate_proj", "model.layers.8.mlp.experts.144.gate_proj", "model.layers.8.mlp.experts.145.gate_proj", "model.layers.8.mlp.experts.146.gate_proj", "model.layers.8.mlp.experts.147.gate_proj", "model.layers.8.mlp.experts.148.gate_proj", "model.layers.8.mlp.experts.149.gate_proj", "model.layers.8.mlp.experts.150.gate_proj", "model.layers.8.mlp.experts.151.gate_proj", "model.layers.8.mlp.experts.152.gate_proj", "model.layers.8.mlp.experts.153.gate_proj", "model.layers.8.mlp.experts.154.gate_proj", "model.layers.8.mlp.experts.155.gate_proj", "model.layers.8.mlp.experts.156.gate_proj", "model.layers.8.mlp.experts.157.gate_proj", "model.layers.8.mlp.experts.158.gate_proj", "model.layers.8.mlp.experts.159.gate_proj", "model.layers.8.mlp.experts.0.up_proj", "model.layers.8.mlp.experts.1.up_proj", "model.layers.8.mlp.experts.2.up_proj", "model.layers.8.mlp.experts.3.up_proj", "model.layers.8.mlp.experts.4.up_proj", "model.layers.8.mlp.experts.5.up_proj", "model.layers.8.mlp.experts.6.up_proj", "model.layers.8.mlp.experts.7.up_proj", "model.layers.8.mlp.experts.8.up_proj", "model.layers.8.mlp.experts.9.up_proj", "model.layers.8.mlp.experts.10.up_proj", "model.layers.8.mlp.experts.11.up_proj", "model.layers.8.mlp.experts.12.up_proj", "model.layers.8.mlp.experts.13.up_proj", "model.layers.8.mlp.experts.14.up_proj", "model.layers.8.mlp.experts.15.up_proj", "model.layers.8.mlp.experts.16.up_proj", "model.layers.8.mlp.experts.17.up_proj", "model.layers.8.mlp.experts.18.up_proj", "model.layers.8.mlp.experts.19.up_proj", "model.layers.8.mlp.experts.20.up_proj", "model.layers.8.mlp.experts.21.up_proj", "model.layers.8.mlp.experts.22.up_proj", "model.layers.8.mlp.experts.23.up_proj", "model.layers.8.mlp.experts.24.up_proj", "model.layers.8.mlp.experts.25.up_proj", "model.layers.8.mlp.experts.26.up_proj", "model.layers.8.mlp.experts.27.up_proj", "model.layers.8.mlp.experts.28.up_proj", "model.layers.8.mlp.experts.29.up_proj", "model.layers.8.mlp.experts.30.up_proj", "model.layers.8.mlp.experts.31.up_proj", "model.layers.8.mlp.experts.32.up_proj", "model.layers.8.mlp.experts.33.up_proj", "model.layers.8.mlp.experts.34.up_proj", "model.layers.8.mlp.experts.35.up_proj", "model.layers.8.mlp.experts.36.up_proj", "model.layers.8.mlp.experts.37.up_proj", "model.layers.8.mlp.experts.38.up_proj", "model.layers.8.mlp.experts.39.up_proj", "model.layers.8.mlp.experts.40.up_proj", "model.layers.8.mlp.experts.41.up_proj", "model.layers.8.mlp.experts.42.up_proj", "model.layers.8.mlp.experts.43.up_proj", "model.layers.8.mlp.experts.44.up_proj", "model.layers.8.mlp.experts.45.up_proj", "model.layers.8.mlp.experts.46.up_proj", "model.layers.8.mlp.experts.47.up_proj", "model.layers.8.mlp.experts.48.up_proj", "model.layers.8.mlp.experts.49.up_proj", "model.layers.8.mlp.experts.50.up_proj", "model.layers.8.mlp.experts.51.up_proj", "model.layers.8.mlp.experts.52.up_proj", "model.layers.8.mlp.experts.53.up_proj", "model.layers.8.mlp.experts.54.up_proj", "model.layers.8.mlp.experts.55.up_proj", "model.layers.8.mlp.experts.56.up_proj", "model.layers.8.mlp.experts.57.up_proj", "model.layers.8.mlp.experts.58.up_proj", "model.layers.8.mlp.experts.59.up_proj", "model.layers.8.mlp.experts.60.up_proj", "model.layers.8.mlp.experts.61.up_proj", "model.layers.8.mlp.experts.62.up_proj", "model.layers.8.mlp.experts.63.up_proj", "model.layers.8.mlp.experts.64.up_proj", "model.layers.8.mlp.experts.65.up_proj", "model.layers.8.mlp.experts.66.up_proj", "model.layers.8.mlp.experts.67.up_proj", "model.layers.8.mlp.experts.68.up_proj", "model.layers.8.mlp.experts.69.up_proj", "model.layers.8.mlp.experts.70.up_proj", "model.layers.8.mlp.experts.71.up_proj", "model.layers.8.mlp.experts.72.up_proj", "model.layers.8.mlp.experts.73.up_proj", "model.layers.8.mlp.experts.74.up_proj", "model.layers.8.mlp.experts.75.up_proj", "model.layers.8.mlp.experts.76.up_proj", "model.layers.8.mlp.experts.77.up_proj", "model.layers.8.mlp.experts.78.up_proj", "model.layers.8.mlp.experts.79.up_proj", "model.layers.8.mlp.experts.80.up_proj", "model.layers.8.mlp.experts.81.up_proj", "model.layers.8.mlp.experts.82.up_proj", "model.layers.8.mlp.experts.83.up_proj", "model.layers.8.mlp.experts.84.up_proj", "model.layers.8.mlp.experts.85.up_proj", "model.layers.8.mlp.experts.86.up_proj", "model.layers.8.mlp.experts.87.up_proj", "model.layers.8.mlp.experts.88.up_proj", "model.layers.8.mlp.experts.89.up_proj", "model.layers.8.mlp.experts.90.up_proj", "model.layers.8.mlp.experts.91.up_proj", "model.layers.8.mlp.experts.92.up_proj", "model.layers.8.mlp.experts.93.up_proj", "model.layers.8.mlp.experts.94.up_proj", "model.layers.8.mlp.experts.95.up_proj", "model.layers.8.mlp.experts.96.up_proj", "model.layers.8.mlp.experts.97.up_proj", "model.layers.8.mlp.experts.98.up_proj", "model.layers.8.mlp.experts.99.up_proj", "model.layers.8.mlp.experts.100.up_proj", "model.layers.8.mlp.experts.101.up_proj", "model.layers.8.mlp.experts.102.up_proj", "model.layers.8.mlp.experts.103.up_proj", "model.layers.8.mlp.experts.104.up_proj", "model.layers.8.mlp.experts.105.up_proj", "model.layers.8.mlp.experts.106.up_proj", "model.layers.8.mlp.experts.107.up_proj", "model.layers.8.mlp.experts.108.up_proj", "model.layers.8.mlp.experts.109.up_proj", "model.layers.8.mlp.experts.110.up_proj", "model.layers.8.mlp.experts.111.up_proj", "model.layers.8.mlp.experts.112.up_proj", "model.layers.8.mlp.experts.113.up_proj", "model.layers.8.mlp.experts.114.up_proj", "model.layers.8.mlp.experts.115.up_proj", "model.layers.8.mlp.experts.116.up_proj", "model.layers.8.mlp.experts.117.up_proj", "model.layers.8.mlp.experts.118.up_proj", "model.layers.8.mlp.experts.119.up_proj", "model.layers.8.mlp.experts.120.up_proj", "model.layers.8.mlp.experts.121.up_proj", "model.layers.8.mlp.experts.122.up_proj", "model.layers.8.mlp.experts.123.up_proj", "model.layers.8.mlp.experts.124.up_proj", "model.layers.8.mlp.experts.125.up_proj", "model.layers.8.mlp.experts.126.up_proj", "model.layers.8.mlp.experts.127.up_proj", "model.layers.8.mlp.experts.128.up_proj", "model.layers.8.mlp.experts.129.up_proj", "model.layers.8.mlp.experts.130.up_proj", "model.layers.8.mlp.experts.131.up_proj", "model.layers.8.mlp.experts.132.up_proj", "model.layers.8.mlp.experts.133.up_proj", "model.layers.8.mlp.experts.134.up_proj", "model.layers.8.mlp.experts.135.up_proj", "model.layers.8.mlp.experts.136.up_proj", "model.layers.8.mlp.experts.137.up_proj", "model.layers.8.mlp.experts.138.up_proj", "model.layers.8.mlp.experts.139.up_proj", "model.layers.8.mlp.experts.140.up_proj", "model.layers.8.mlp.experts.141.up_proj", "model.layers.8.mlp.experts.142.up_proj", "model.layers.8.mlp.experts.143.up_proj", "model.layers.8.mlp.experts.144.up_proj", "model.layers.8.mlp.experts.145.up_proj", "model.layers.8.mlp.experts.146.up_proj", "model.layers.8.mlp.experts.147.up_proj", "model.layers.8.mlp.experts.148.up_proj", "model.layers.8.mlp.experts.149.up_proj", "model.layers.8.mlp.experts.150.up_proj", "model.layers.8.mlp.experts.151.up_proj", "model.layers.8.mlp.experts.152.up_proj", "model.layers.8.mlp.experts.153.up_proj", "model.layers.8.mlp.experts.154.up_proj", "model.layers.8.mlp.experts.155.up_proj", "model.layers.8.mlp.experts.156.up_proj", "model.layers.8.mlp.experts.157.up_proj", "model.layers.8.mlp.experts.158.up_proj", "model.layers.8.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.8852786161005844e-05, "dbits": 2516582400 }, { "dkld": -3.5988446325062665e-05, "dbits": 5033164800 } ] }, { "idx": 50, "layers": [ "model.layers.8.mlp.experts.0.down_proj", "model.layers.8.mlp.experts.1.down_proj", "model.layers.8.mlp.experts.2.down_proj", "model.layers.8.mlp.experts.3.down_proj", "model.layers.8.mlp.experts.4.down_proj", "model.layers.8.mlp.experts.5.down_proj", "model.layers.8.mlp.experts.6.down_proj", "model.layers.8.mlp.experts.7.down_proj", "model.layers.8.mlp.experts.8.down_proj", "model.layers.8.mlp.experts.9.down_proj", "model.layers.8.mlp.experts.10.down_proj", "model.layers.8.mlp.experts.11.down_proj", "model.layers.8.mlp.experts.12.down_proj", "model.layers.8.mlp.experts.13.down_proj", "model.layers.8.mlp.experts.14.down_proj", "model.layers.8.mlp.experts.15.down_proj", "model.layers.8.mlp.experts.16.down_proj", "model.layers.8.mlp.experts.17.down_proj", "model.layers.8.mlp.experts.18.down_proj", "model.layers.8.mlp.experts.19.down_proj", "model.layers.8.mlp.experts.20.down_proj", "model.layers.8.mlp.experts.21.down_proj", "model.layers.8.mlp.experts.22.down_proj", "model.layers.8.mlp.experts.23.down_proj", "model.layers.8.mlp.experts.24.down_proj", "model.layers.8.mlp.experts.25.down_proj", "model.layers.8.mlp.experts.26.down_proj", "model.layers.8.mlp.experts.27.down_proj", "model.layers.8.mlp.experts.28.down_proj", "model.layers.8.mlp.experts.29.down_proj", "model.layers.8.mlp.experts.30.down_proj", "model.layers.8.mlp.experts.31.down_proj", "model.layers.8.mlp.experts.32.down_proj", "model.layers.8.mlp.experts.33.down_proj", "model.layers.8.mlp.experts.34.down_proj", "model.layers.8.mlp.experts.35.down_proj", "model.layers.8.mlp.experts.36.down_proj", "model.layers.8.mlp.experts.37.down_proj", "model.layers.8.mlp.experts.38.down_proj", "model.layers.8.mlp.experts.39.down_proj", "model.layers.8.mlp.experts.40.down_proj", "model.layers.8.mlp.experts.41.down_proj", "model.layers.8.mlp.experts.42.down_proj", "model.layers.8.mlp.experts.43.down_proj", "model.layers.8.mlp.experts.44.down_proj", "model.layers.8.mlp.experts.45.down_proj", "model.layers.8.mlp.experts.46.down_proj", "model.layers.8.mlp.experts.47.down_proj", "model.layers.8.mlp.experts.48.down_proj", "model.layers.8.mlp.experts.49.down_proj", "model.layers.8.mlp.experts.50.down_proj", "model.layers.8.mlp.experts.51.down_proj", "model.layers.8.mlp.experts.52.down_proj", "model.layers.8.mlp.experts.53.down_proj", "model.layers.8.mlp.experts.54.down_proj", "model.layers.8.mlp.experts.55.down_proj", "model.layers.8.mlp.experts.56.down_proj", "model.layers.8.mlp.experts.57.down_proj", "model.layers.8.mlp.experts.58.down_proj", "model.layers.8.mlp.experts.59.down_proj", "model.layers.8.mlp.experts.60.down_proj", "model.layers.8.mlp.experts.61.down_proj", "model.layers.8.mlp.experts.62.down_proj", "model.layers.8.mlp.experts.63.down_proj", "model.layers.8.mlp.experts.64.down_proj", "model.layers.8.mlp.experts.65.down_proj", "model.layers.8.mlp.experts.66.down_proj", "model.layers.8.mlp.experts.67.down_proj", "model.layers.8.mlp.experts.68.down_proj", "model.layers.8.mlp.experts.69.down_proj", "model.layers.8.mlp.experts.70.down_proj", "model.layers.8.mlp.experts.71.down_proj", "model.layers.8.mlp.experts.72.down_proj", "model.layers.8.mlp.experts.73.down_proj", "model.layers.8.mlp.experts.74.down_proj", "model.layers.8.mlp.experts.75.down_proj", "model.layers.8.mlp.experts.76.down_proj", "model.layers.8.mlp.experts.77.down_proj", "model.layers.8.mlp.experts.78.down_proj", "model.layers.8.mlp.experts.79.down_proj", "model.layers.8.mlp.experts.80.down_proj", "model.layers.8.mlp.experts.81.down_proj", "model.layers.8.mlp.experts.82.down_proj", "model.layers.8.mlp.experts.83.down_proj", "model.layers.8.mlp.experts.84.down_proj", "model.layers.8.mlp.experts.85.down_proj", "model.layers.8.mlp.experts.86.down_proj", "model.layers.8.mlp.experts.87.down_proj", "model.layers.8.mlp.experts.88.down_proj", "model.layers.8.mlp.experts.89.down_proj", "model.layers.8.mlp.experts.90.down_proj", "model.layers.8.mlp.experts.91.down_proj", "model.layers.8.mlp.experts.92.down_proj", "model.layers.8.mlp.experts.93.down_proj", "model.layers.8.mlp.experts.94.down_proj", "model.layers.8.mlp.experts.95.down_proj", "model.layers.8.mlp.experts.96.down_proj", "model.layers.8.mlp.experts.97.down_proj", "model.layers.8.mlp.experts.98.down_proj", "model.layers.8.mlp.experts.99.down_proj", "model.layers.8.mlp.experts.100.down_proj", "model.layers.8.mlp.experts.101.down_proj", "model.layers.8.mlp.experts.102.down_proj", "model.layers.8.mlp.experts.103.down_proj", "model.layers.8.mlp.experts.104.down_proj", "model.layers.8.mlp.experts.105.down_proj", "model.layers.8.mlp.experts.106.down_proj", "model.layers.8.mlp.experts.107.down_proj", "model.layers.8.mlp.experts.108.down_proj", "model.layers.8.mlp.experts.109.down_proj", "model.layers.8.mlp.experts.110.down_proj", "model.layers.8.mlp.experts.111.down_proj", "model.layers.8.mlp.experts.112.down_proj", "model.layers.8.mlp.experts.113.down_proj", "model.layers.8.mlp.experts.114.down_proj", "model.layers.8.mlp.experts.115.down_proj", "model.layers.8.mlp.experts.116.down_proj", "model.layers.8.mlp.experts.117.down_proj", "model.layers.8.mlp.experts.118.down_proj", "model.layers.8.mlp.experts.119.down_proj", "model.layers.8.mlp.experts.120.down_proj", "model.layers.8.mlp.experts.121.down_proj", "model.layers.8.mlp.experts.122.down_proj", "model.layers.8.mlp.experts.123.down_proj", "model.layers.8.mlp.experts.124.down_proj", "model.layers.8.mlp.experts.125.down_proj", "model.layers.8.mlp.experts.126.down_proj", "model.layers.8.mlp.experts.127.down_proj", "model.layers.8.mlp.experts.128.down_proj", "model.layers.8.mlp.experts.129.down_proj", "model.layers.8.mlp.experts.130.down_proj", "model.layers.8.mlp.experts.131.down_proj", "model.layers.8.mlp.experts.132.down_proj", "model.layers.8.mlp.experts.133.down_proj", "model.layers.8.mlp.experts.134.down_proj", "model.layers.8.mlp.experts.135.down_proj", "model.layers.8.mlp.experts.136.down_proj", "model.layers.8.mlp.experts.137.down_proj", "model.layers.8.mlp.experts.138.down_proj", "model.layers.8.mlp.experts.139.down_proj", "model.layers.8.mlp.experts.140.down_proj", "model.layers.8.mlp.experts.141.down_proj", "model.layers.8.mlp.experts.142.down_proj", "model.layers.8.mlp.experts.143.down_proj", "model.layers.8.mlp.experts.144.down_proj", "model.layers.8.mlp.experts.145.down_proj", "model.layers.8.mlp.experts.146.down_proj", "model.layers.8.mlp.experts.147.down_proj", "model.layers.8.mlp.experts.148.down_proj", "model.layers.8.mlp.experts.149.down_proj", "model.layers.8.mlp.experts.150.down_proj", "model.layers.8.mlp.experts.151.down_proj", "model.layers.8.mlp.experts.152.down_proj", "model.layers.8.mlp.experts.153.down_proj", "model.layers.8.mlp.experts.154.down_proj", "model.layers.8.mlp.experts.155.down_proj", "model.layers.8.mlp.experts.156.down_proj", "model.layers.8.mlp.experts.157.down_proj", "model.layers.8.mlp.experts.158.down_proj", "model.layers.8.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -7.446110248565674e-05, "dbits": 1258291200 }, { "dkld": -5.373328458517686e-05, "dbits": 2516582400 } ] }, { "idx": 51, "layers": [ "model.layers.9.self_attn.q_proj" ], "candidates": [ { "dkld": -3.7198467180131825e-05, "dbits": 62914560 }, { "dkld": -3.7582591176019142e-06, "dbits": 125829120 } ] }, { "idx": 52, "layers": [ "model.layers.9.self_attn.k_proj", "model.layers.9.self_attn.v_proj" ], "candidates": [ { "dkld": 6.932145915925642e-05, "dbits": 10485760 }, { "dkld": 2.2798869758845763e-05, "dbits": 20971520 } ] }, { "idx": 53, "layers": [ "model.layers.9.self_attn.o_proj" ], "candidates": [ { "dkld": -4.819061141460995e-05, "dbits": 62914560 }, { "dkld": -0.00011790816206484929, "dbits": 125829120 } ] }, { "idx": 54, "layers": [ "model.layers.9.mlp.shared_experts.gate_proj", "model.layers.9.mlp.shared_experts.up_proj", "model.layers.9.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 8.194232359528576e-05, "dbits": 23592960 }, { "dkld": 7.315184921026334e-05, "dbits": 47185920 } ] }, { "idx": 55, "layers": [ "model.layers.9.mlp.experts.0.gate_proj", "model.layers.9.mlp.experts.1.gate_proj", "model.layers.9.mlp.experts.2.gate_proj", "model.layers.9.mlp.experts.3.gate_proj", "model.layers.9.mlp.experts.4.gate_proj", "model.layers.9.mlp.experts.5.gate_proj", "model.layers.9.mlp.experts.6.gate_proj", "model.layers.9.mlp.experts.7.gate_proj", "model.layers.9.mlp.experts.8.gate_proj", "model.layers.9.mlp.experts.9.gate_proj", "model.layers.9.mlp.experts.10.gate_proj", "model.layers.9.mlp.experts.11.gate_proj", "model.layers.9.mlp.experts.12.gate_proj", "model.layers.9.mlp.experts.13.gate_proj", "model.layers.9.mlp.experts.14.gate_proj", "model.layers.9.mlp.experts.15.gate_proj", "model.layers.9.mlp.experts.16.gate_proj", "model.layers.9.mlp.experts.17.gate_proj", "model.layers.9.mlp.experts.18.gate_proj", "model.layers.9.mlp.experts.19.gate_proj", "model.layers.9.mlp.experts.20.gate_proj", "model.layers.9.mlp.experts.21.gate_proj", "model.layers.9.mlp.experts.22.gate_proj", "model.layers.9.mlp.experts.23.gate_proj", "model.layers.9.mlp.experts.24.gate_proj", "model.layers.9.mlp.experts.25.gate_proj", "model.layers.9.mlp.experts.26.gate_proj", "model.layers.9.mlp.experts.27.gate_proj", "model.layers.9.mlp.experts.28.gate_proj", "model.layers.9.mlp.experts.29.gate_proj", "model.layers.9.mlp.experts.30.gate_proj", "model.layers.9.mlp.experts.31.gate_proj", "model.layers.9.mlp.experts.32.gate_proj", "model.layers.9.mlp.experts.33.gate_proj", "model.layers.9.mlp.experts.34.gate_proj", "model.layers.9.mlp.experts.35.gate_proj", "model.layers.9.mlp.experts.36.gate_proj", "model.layers.9.mlp.experts.37.gate_proj", "model.layers.9.mlp.experts.38.gate_proj", "model.layers.9.mlp.experts.39.gate_proj", "model.layers.9.mlp.experts.40.gate_proj", "model.layers.9.mlp.experts.41.gate_proj", "model.layers.9.mlp.experts.42.gate_proj", "model.layers.9.mlp.experts.43.gate_proj", "model.layers.9.mlp.experts.44.gate_proj", "model.layers.9.mlp.experts.45.gate_proj", "model.layers.9.mlp.experts.46.gate_proj", "model.layers.9.mlp.experts.47.gate_proj", "model.layers.9.mlp.experts.48.gate_proj", "model.layers.9.mlp.experts.49.gate_proj", "model.layers.9.mlp.experts.50.gate_proj", "model.layers.9.mlp.experts.51.gate_proj", "model.layers.9.mlp.experts.52.gate_proj", "model.layers.9.mlp.experts.53.gate_proj", "model.layers.9.mlp.experts.54.gate_proj", "model.layers.9.mlp.experts.55.gate_proj", "model.layers.9.mlp.experts.56.gate_proj", "model.layers.9.mlp.experts.57.gate_proj", "model.layers.9.mlp.experts.58.gate_proj", "model.layers.9.mlp.experts.59.gate_proj", "model.layers.9.mlp.experts.60.gate_proj", "model.layers.9.mlp.experts.61.gate_proj", "model.layers.9.mlp.experts.62.gate_proj", "model.layers.9.mlp.experts.63.gate_proj", "model.layers.9.mlp.experts.64.gate_proj", "model.layers.9.mlp.experts.65.gate_proj", "model.layers.9.mlp.experts.66.gate_proj", "model.layers.9.mlp.experts.67.gate_proj", "model.layers.9.mlp.experts.68.gate_proj", "model.layers.9.mlp.experts.69.gate_proj", "model.layers.9.mlp.experts.70.gate_proj", "model.layers.9.mlp.experts.71.gate_proj", "model.layers.9.mlp.experts.72.gate_proj", "model.layers.9.mlp.experts.73.gate_proj", "model.layers.9.mlp.experts.74.gate_proj", "model.layers.9.mlp.experts.75.gate_proj", "model.layers.9.mlp.experts.76.gate_proj", "model.layers.9.mlp.experts.77.gate_proj", "model.layers.9.mlp.experts.78.gate_proj", "model.layers.9.mlp.experts.79.gate_proj", "model.layers.9.mlp.experts.80.gate_proj", "model.layers.9.mlp.experts.81.gate_proj", "model.layers.9.mlp.experts.82.gate_proj", "model.layers.9.mlp.experts.83.gate_proj", "model.layers.9.mlp.experts.84.gate_proj", "model.layers.9.mlp.experts.85.gate_proj", "model.layers.9.mlp.experts.86.gate_proj", "model.layers.9.mlp.experts.87.gate_proj", "model.layers.9.mlp.experts.88.gate_proj", "model.layers.9.mlp.experts.89.gate_proj", "model.layers.9.mlp.experts.90.gate_proj", "model.layers.9.mlp.experts.91.gate_proj", "model.layers.9.mlp.experts.92.gate_proj", "model.layers.9.mlp.experts.93.gate_proj", "model.layers.9.mlp.experts.94.gate_proj", "model.layers.9.mlp.experts.95.gate_proj", "model.layers.9.mlp.experts.96.gate_proj", "model.layers.9.mlp.experts.97.gate_proj", "model.layers.9.mlp.experts.98.gate_proj", "model.layers.9.mlp.experts.99.gate_proj", "model.layers.9.mlp.experts.100.gate_proj", "model.layers.9.mlp.experts.101.gate_proj", "model.layers.9.mlp.experts.102.gate_proj", "model.layers.9.mlp.experts.103.gate_proj", "model.layers.9.mlp.experts.104.gate_proj", "model.layers.9.mlp.experts.105.gate_proj", "model.layers.9.mlp.experts.106.gate_proj", "model.layers.9.mlp.experts.107.gate_proj", "model.layers.9.mlp.experts.108.gate_proj", "model.layers.9.mlp.experts.109.gate_proj", "model.layers.9.mlp.experts.110.gate_proj", "model.layers.9.mlp.experts.111.gate_proj", "model.layers.9.mlp.experts.112.gate_proj", "model.layers.9.mlp.experts.113.gate_proj", "model.layers.9.mlp.experts.114.gate_proj", "model.layers.9.mlp.experts.115.gate_proj", "model.layers.9.mlp.experts.116.gate_proj", "model.layers.9.mlp.experts.117.gate_proj", "model.layers.9.mlp.experts.118.gate_proj", "model.layers.9.mlp.experts.119.gate_proj", "model.layers.9.mlp.experts.120.gate_proj", "model.layers.9.mlp.experts.121.gate_proj", "model.layers.9.mlp.experts.122.gate_proj", "model.layers.9.mlp.experts.123.gate_proj", "model.layers.9.mlp.experts.124.gate_proj", "model.layers.9.mlp.experts.125.gate_proj", "model.layers.9.mlp.experts.126.gate_proj", "model.layers.9.mlp.experts.127.gate_proj", "model.layers.9.mlp.experts.128.gate_proj", "model.layers.9.mlp.experts.129.gate_proj", "model.layers.9.mlp.experts.130.gate_proj", "model.layers.9.mlp.experts.131.gate_proj", "model.layers.9.mlp.experts.132.gate_proj", "model.layers.9.mlp.experts.133.gate_proj", "model.layers.9.mlp.experts.134.gate_proj", "model.layers.9.mlp.experts.135.gate_proj", "model.layers.9.mlp.experts.136.gate_proj", "model.layers.9.mlp.experts.137.gate_proj", "model.layers.9.mlp.experts.138.gate_proj", "model.layers.9.mlp.experts.139.gate_proj", "model.layers.9.mlp.experts.140.gate_proj", "model.layers.9.mlp.experts.141.gate_proj", "model.layers.9.mlp.experts.142.gate_proj", "model.layers.9.mlp.experts.143.gate_proj", "model.layers.9.mlp.experts.144.gate_proj", "model.layers.9.mlp.experts.145.gate_proj", "model.layers.9.mlp.experts.146.gate_proj", "model.layers.9.mlp.experts.147.gate_proj", "model.layers.9.mlp.experts.148.gate_proj", "model.layers.9.mlp.experts.149.gate_proj", "model.layers.9.mlp.experts.150.gate_proj", "model.layers.9.mlp.experts.151.gate_proj", "model.layers.9.mlp.experts.152.gate_proj", "model.layers.9.mlp.experts.153.gate_proj", "model.layers.9.mlp.experts.154.gate_proj", "model.layers.9.mlp.experts.155.gate_proj", "model.layers.9.mlp.experts.156.gate_proj", "model.layers.9.mlp.experts.157.gate_proj", "model.layers.9.mlp.experts.158.gate_proj", "model.layers.9.mlp.experts.159.gate_proj", "model.layers.9.mlp.experts.0.up_proj", "model.layers.9.mlp.experts.1.up_proj", "model.layers.9.mlp.experts.2.up_proj", "model.layers.9.mlp.experts.3.up_proj", "model.layers.9.mlp.experts.4.up_proj", "model.layers.9.mlp.experts.5.up_proj", "model.layers.9.mlp.experts.6.up_proj", "model.layers.9.mlp.experts.7.up_proj", "model.layers.9.mlp.experts.8.up_proj", "model.layers.9.mlp.experts.9.up_proj", "model.layers.9.mlp.experts.10.up_proj", "model.layers.9.mlp.experts.11.up_proj", "model.layers.9.mlp.experts.12.up_proj", "model.layers.9.mlp.experts.13.up_proj", "model.layers.9.mlp.experts.14.up_proj", "model.layers.9.mlp.experts.15.up_proj", "model.layers.9.mlp.experts.16.up_proj", "model.layers.9.mlp.experts.17.up_proj", "model.layers.9.mlp.experts.18.up_proj", "model.layers.9.mlp.experts.19.up_proj", "model.layers.9.mlp.experts.20.up_proj", "model.layers.9.mlp.experts.21.up_proj", "model.layers.9.mlp.experts.22.up_proj", "model.layers.9.mlp.experts.23.up_proj", "model.layers.9.mlp.experts.24.up_proj", "model.layers.9.mlp.experts.25.up_proj", "model.layers.9.mlp.experts.26.up_proj", "model.layers.9.mlp.experts.27.up_proj", "model.layers.9.mlp.experts.28.up_proj", "model.layers.9.mlp.experts.29.up_proj", "model.layers.9.mlp.experts.30.up_proj", "model.layers.9.mlp.experts.31.up_proj", "model.layers.9.mlp.experts.32.up_proj", "model.layers.9.mlp.experts.33.up_proj", "model.layers.9.mlp.experts.34.up_proj", "model.layers.9.mlp.experts.35.up_proj", "model.layers.9.mlp.experts.36.up_proj", "model.layers.9.mlp.experts.37.up_proj", "model.layers.9.mlp.experts.38.up_proj", "model.layers.9.mlp.experts.39.up_proj", "model.layers.9.mlp.experts.40.up_proj", "model.layers.9.mlp.experts.41.up_proj", "model.layers.9.mlp.experts.42.up_proj", "model.layers.9.mlp.experts.43.up_proj", "model.layers.9.mlp.experts.44.up_proj", "model.layers.9.mlp.experts.45.up_proj", "model.layers.9.mlp.experts.46.up_proj", "model.layers.9.mlp.experts.47.up_proj", "model.layers.9.mlp.experts.48.up_proj", "model.layers.9.mlp.experts.49.up_proj", "model.layers.9.mlp.experts.50.up_proj", "model.layers.9.mlp.experts.51.up_proj", "model.layers.9.mlp.experts.52.up_proj", "model.layers.9.mlp.experts.53.up_proj", "model.layers.9.mlp.experts.54.up_proj", "model.layers.9.mlp.experts.55.up_proj", "model.layers.9.mlp.experts.56.up_proj", "model.layers.9.mlp.experts.57.up_proj", "model.layers.9.mlp.experts.58.up_proj", "model.layers.9.mlp.experts.59.up_proj", "model.layers.9.mlp.experts.60.up_proj", "model.layers.9.mlp.experts.61.up_proj", "model.layers.9.mlp.experts.62.up_proj", "model.layers.9.mlp.experts.63.up_proj", "model.layers.9.mlp.experts.64.up_proj", "model.layers.9.mlp.experts.65.up_proj", "model.layers.9.mlp.experts.66.up_proj", "model.layers.9.mlp.experts.67.up_proj", "model.layers.9.mlp.experts.68.up_proj", "model.layers.9.mlp.experts.69.up_proj", "model.layers.9.mlp.experts.70.up_proj", "model.layers.9.mlp.experts.71.up_proj", "model.layers.9.mlp.experts.72.up_proj", "model.layers.9.mlp.experts.73.up_proj", "model.layers.9.mlp.experts.74.up_proj", "model.layers.9.mlp.experts.75.up_proj", "model.layers.9.mlp.experts.76.up_proj", "model.layers.9.mlp.experts.77.up_proj", "model.layers.9.mlp.experts.78.up_proj", "model.layers.9.mlp.experts.79.up_proj", "model.layers.9.mlp.experts.80.up_proj", "model.layers.9.mlp.experts.81.up_proj", "model.layers.9.mlp.experts.82.up_proj", "model.layers.9.mlp.experts.83.up_proj", "model.layers.9.mlp.experts.84.up_proj", "model.layers.9.mlp.experts.85.up_proj", "model.layers.9.mlp.experts.86.up_proj", "model.layers.9.mlp.experts.87.up_proj", "model.layers.9.mlp.experts.88.up_proj", "model.layers.9.mlp.experts.89.up_proj", "model.layers.9.mlp.experts.90.up_proj", "model.layers.9.mlp.experts.91.up_proj", "model.layers.9.mlp.experts.92.up_proj", "model.layers.9.mlp.experts.93.up_proj", "model.layers.9.mlp.experts.94.up_proj", "model.layers.9.mlp.experts.95.up_proj", "model.layers.9.mlp.experts.96.up_proj", "model.layers.9.mlp.experts.97.up_proj", "model.layers.9.mlp.experts.98.up_proj", "model.layers.9.mlp.experts.99.up_proj", "model.layers.9.mlp.experts.100.up_proj", "model.layers.9.mlp.experts.101.up_proj", "model.layers.9.mlp.experts.102.up_proj", "model.layers.9.mlp.experts.103.up_proj", "model.layers.9.mlp.experts.104.up_proj", "model.layers.9.mlp.experts.105.up_proj", "model.layers.9.mlp.experts.106.up_proj", "model.layers.9.mlp.experts.107.up_proj", "model.layers.9.mlp.experts.108.up_proj", "model.layers.9.mlp.experts.109.up_proj", "model.layers.9.mlp.experts.110.up_proj", "model.layers.9.mlp.experts.111.up_proj", "model.layers.9.mlp.experts.112.up_proj", "model.layers.9.mlp.experts.113.up_proj", "model.layers.9.mlp.experts.114.up_proj", "model.layers.9.mlp.experts.115.up_proj", "model.layers.9.mlp.experts.116.up_proj", "model.layers.9.mlp.experts.117.up_proj", "model.layers.9.mlp.experts.118.up_proj", "model.layers.9.mlp.experts.119.up_proj", "model.layers.9.mlp.experts.120.up_proj", "model.layers.9.mlp.experts.121.up_proj", "model.layers.9.mlp.experts.122.up_proj", "model.layers.9.mlp.experts.123.up_proj", "model.layers.9.mlp.experts.124.up_proj", "model.layers.9.mlp.experts.125.up_proj", "model.layers.9.mlp.experts.126.up_proj", "model.layers.9.mlp.experts.127.up_proj", "model.layers.9.mlp.experts.128.up_proj", "model.layers.9.mlp.experts.129.up_proj", "model.layers.9.mlp.experts.130.up_proj", "model.layers.9.mlp.experts.131.up_proj", "model.layers.9.mlp.experts.132.up_proj", "model.layers.9.mlp.experts.133.up_proj", "model.layers.9.mlp.experts.134.up_proj", "model.layers.9.mlp.experts.135.up_proj", "model.layers.9.mlp.experts.136.up_proj", "model.layers.9.mlp.experts.137.up_proj", "model.layers.9.mlp.experts.138.up_proj", "model.layers.9.mlp.experts.139.up_proj", "model.layers.9.mlp.experts.140.up_proj", "model.layers.9.mlp.experts.141.up_proj", "model.layers.9.mlp.experts.142.up_proj", "model.layers.9.mlp.experts.143.up_proj", "model.layers.9.mlp.experts.144.up_proj", "model.layers.9.mlp.experts.145.up_proj", "model.layers.9.mlp.experts.146.up_proj", "model.layers.9.mlp.experts.147.up_proj", "model.layers.9.mlp.experts.148.up_proj", "model.layers.9.mlp.experts.149.up_proj", "model.layers.9.mlp.experts.150.up_proj", "model.layers.9.mlp.experts.151.up_proj", "model.layers.9.mlp.experts.152.up_proj", "model.layers.9.mlp.experts.153.up_proj", "model.layers.9.mlp.experts.154.up_proj", "model.layers.9.mlp.experts.155.up_proj", "model.layers.9.mlp.experts.156.up_proj", "model.layers.9.mlp.experts.157.up_proj", "model.layers.9.mlp.experts.158.up_proj", "model.layers.9.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.717869985848596e-05, "dbits": 2516582400 }, { "dkld": -7.660232950001955e-05, "dbits": 5033164800 } ] }, { "idx": 56, "layers": [ "model.layers.9.mlp.experts.0.down_proj", "model.layers.9.mlp.experts.1.down_proj", "model.layers.9.mlp.experts.2.down_proj", "model.layers.9.mlp.experts.3.down_proj", "model.layers.9.mlp.experts.4.down_proj", "model.layers.9.mlp.experts.5.down_proj", "model.layers.9.mlp.experts.6.down_proj", "model.layers.9.mlp.experts.7.down_proj", "model.layers.9.mlp.experts.8.down_proj", "model.layers.9.mlp.experts.9.down_proj", "model.layers.9.mlp.experts.10.down_proj", "model.layers.9.mlp.experts.11.down_proj", "model.layers.9.mlp.experts.12.down_proj", "model.layers.9.mlp.experts.13.down_proj", "model.layers.9.mlp.experts.14.down_proj", "model.layers.9.mlp.experts.15.down_proj", "model.layers.9.mlp.experts.16.down_proj", "model.layers.9.mlp.experts.17.down_proj", "model.layers.9.mlp.experts.18.down_proj", "model.layers.9.mlp.experts.19.down_proj", "model.layers.9.mlp.experts.20.down_proj", "model.layers.9.mlp.experts.21.down_proj", "model.layers.9.mlp.experts.22.down_proj", "model.layers.9.mlp.experts.23.down_proj", "model.layers.9.mlp.experts.24.down_proj", "model.layers.9.mlp.experts.25.down_proj", "model.layers.9.mlp.experts.26.down_proj", "model.layers.9.mlp.experts.27.down_proj", "model.layers.9.mlp.experts.28.down_proj", "model.layers.9.mlp.experts.29.down_proj", "model.layers.9.mlp.experts.30.down_proj", "model.layers.9.mlp.experts.31.down_proj", "model.layers.9.mlp.experts.32.down_proj", "model.layers.9.mlp.experts.33.down_proj", "model.layers.9.mlp.experts.34.down_proj", "model.layers.9.mlp.experts.35.down_proj", "model.layers.9.mlp.experts.36.down_proj", "model.layers.9.mlp.experts.37.down_proj", "model.layers.9.mlp.experts.38.down_proj", "model.layers.9.mlp.experts.39.down_proj", "model.layers.9.mlp.experts.40.down_proj", "model.layers.9.mlp.experts.41.down_proj", "model.layers.9.mlp.experts.42.down_proj", "model.layers.9.mlp.experts.43.down_proj", "model.layers.9.mlp.experts.44.down_proj", "model.layers.9.mlp.experts.45.down_proj", "model.layers.9.mlp.experts.46.down_proj", "model.layers.9.mlp.experts.47.down_proj", "model.layers.9.mlp.experts.48.down_proj", "model.layers.9.mlp.experts.49.down_proj", "model.layers.9.mlp.experts.50.down_proj", "model.layers.9.mlp.experts.51.down_proj", "model.layers.9.mlp.experts.52.down_proj", "model.layers.9.mlp.experts.53.down_proj", "model.layers.9.mlp.experts.54.down_proj", "model.layers.9.mlp.experts.55.down_proj", "model.layers.9.mlp.experts.56.down_proj", "model.layers.9.mlp.experts.57.down_proj", "model.layers.9.mlp.experts.58.down_proj", "model.layers.9.mlp.experts.59.down_proj", "model.layers.9.mlp.experts.60.down_proj", "model.layers.9.mlp.experts.61.down_proj", "model.layers.9.mlp.experts.62.down_proj", "model.layers.9.mlp.experts.63.down_proj", "model.layers.9.mlp.experts.64.down_proj", "model.layers.9.mlp.experts.65.down_proj", "model.layers.9.mlp.experts.66.down_proj", "model.layers.9.mlp.experts.67.down_proj", "model.layers.9.mlp.experts.68.down_proj", "model.layers.9.mlp.experts.69.down_proj", "model.layers.9.mlp.experts.70.down_proj", "model.layers.9.mlp.experts.71.down_proj", "model.layers.9.mlp.experts.72.down_proj", "model.layers.9.mlp.experts.73.down_proj", "model.layers.9.mlp.experts.74.down_proj", "model.layers.9.mlp.experts.75.down_proj", "model.layers.9.mlp.experts.76.down_proj", "model.layers.9.mlp.experts.77.down_proj", "model.layers.9.mlp.experts.78.down_proj", "model.layers.9.mlp.experts.79.down_proj", "model.layers.9.mlp.experts.80.down_proj", "model.layers.9.mlp.experts.81.down_proj", "model.layers.9.mlp.experts.82.down_proj", "model.layers.9.mlp.experts.83.down_proj", "model.layers.9.mlp.experts.84.down_proj", "model.layers.9.mlp.experts.85.down_proj", "model.layers.9.mlp.experts.86.down_proj", "model.layers.9.mlp.experts.87.down_proj", "model.layers.9.mlp.experts.88.down_proj", "model.layers.9.mlp.experts.89.down_proj", "model.layers.9.mlp.experts.90.down_proj", "model.layers.9.mlp.experts.91.down_proj", "model.layers.9.mlp.experts.92.down_proj", "model.layers.9.mlp.experts.93.down_proj", "model.layers.9.mlp.experts.94.down_proj", "model.layers.9.mlp.experts.95.down_proj", "model.layers.9.mlp.experts.96.down_proj", "model.layers.9.mlp.experts.97.down_proj", "model.layers.9.mlp.experts.98.down_proj", "model.layers.9.mlp.experts.99.down_proj", "model.layers.9.mlp.experts.100.down_proj", "model.layers.9.mlp.experts.101.down_proj", "model.layers.9.mlp.experts.102.down_proj", "model.layers.9.mlp.experts.103.down_proj", "model.layers.9.mlp.experts.104.down_proj", "model.layers.9.mlp.experts.105.down_proj", "model.layers.9.mlp.experts.106.down_proj", "model.layers.9.mlp.experts.107.down_proj", "model.layers.9.mlp.experts.108.down_proj", "model.layers.9.mlp.experts.109.down_proj", "model.layers.9.mlp.experts.110.down_proj", "model.layers.9.mlp.experts.111.down_proj", "model.layers.9.mlp.experts.112.down_proj", "model.layers.9.mlp.experts.113.down_proj", "model.layers.9.mlp.experts.114.down_proj", "model.layers.9.mlp.experts.115.down_proj", "model.layers.9.mlp.experts.116.down_proj", "model.layers.9.mlp.experts.117.down_proj", "model.layers.9.mlp.experts.118.down_proj", "model.layers.9.mlp.experts.119.down_proj", "model.layers.9.mlp.experts.120.down_proj", "model.layers.9.mlp.experts.121.down_proj", "model.layers.9.mlp.experts.122.down_proj", "model.layers.9.mlp.experts.123.down_proj", "model.layers.9.mlp.experts.124.down_proj", "model.layers.9.mlp.experts.125.down_proj", "model.layers.9.mlp.experts.126.down_proj", "model.layers.9.mlp.experts.127.down_proj", "model.layers.9.mlp.experts.128.down_proj", "model.layers.9.mlp.experts.129.down_proj", "model.layers.9.mlp.experts.130.down_proj", "model.layers.9.mlp.experts.131.down_proj", "model.layers.9.mlp.experts.132.down_proj", "model.layers.9.mlp.experts.133.down_proj", "model.layers.9.mlp.experts.134.down_proj", "model.layers.9.mlp.experts.135.down_proj", "model.layers.9.mlp.experts.136.down_proj", "model.layers.9.mlp.experts.137.down_proj", "model.layers.9.mlp.experts.138.down_proj", "model.layers.9.mlp.experts.139.down_proj", "model.layers.9.mlp.experts.140.down_proj", "model.layers.9.mlp.experts.141.down_proj", "model.layers.9.mlp.experts.142.down_proj", "model.layers.9.mlp.experts.143.down_proj", "model.layers.9.mlp.experts.144.down_proj", "model.layers.9.mlp.experts.145.down_proj", "model.layers.9.mlp.experts.146.down_proj", "model.layers.9.mlp.experts.147.down_proj", "model.layers.9.mlp.experts.148.down_proj", "model.layers.9.mlp.experts.149.down_proj", "model.layers.9.mlp.experts.150.down_proj", "model.layers.9.mlp.experts.151.down_proj", "model.layers.9.mlp.experts.152.down_proj", "model.layers.9.mlp.experts.153.down_proj", "model.layers.9.mlp.experts.154.down_proj", "model.layers.9.mlp.experts.155.down_proj", "model.layers.9.mlp.experts.156.down_proj", "model.layers.9.mlp.experts.157.down_proj", "model.layers.9.mlp.experts.158.down_proj", "model.layers.9.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.454315010458127e-05, "dbits": 1258291200 }, { "dkld": 1.257183030247723e-05, "dbits": 2516582400 } ] }, { "idx": 57, "layers": [ "model.layers.10.self_attn.q_proj" ], "candidates": [ { "dkld": -4.397414159029722e-05, "dbits": 62914560 }, { "dkld": 2.950150519610492e-06, "dbits": 125829120 } ] }, { "idx": 58, "layers": [ "model.layers.10.self_attn.k_proj", "model.layers.10.self_attn.v_proj" ], "candidates": [ { "dkld": 0.00010748510248959064, "dbits": 10485760 }, { "dkld": -0.00013290527276694705, "dbits": 20971520 } ] }, { "idx": 59, "layers": [ "model.layers.10.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00019829133525490691, "dbits": 62914560 }, { "dkld": -0.00016102313529699902, "dbits": 125829120 } ] }, { "idx": 60, "layers": [ "model.layers.10.mlp.shared_experts.gate_proj", "model.layers.10.mlp.shared_experts.up_proj", "model.layers.10.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 2.248515374958515e-05, "dbits": 23592960 }, { "dkld": 1.4096056111157287e-05, "dbits": 47185920 } ] }, { "idx": 61, "layers": [ "model.layers.10.mlp.experts.0.gate_proj", "model.layers.10.mlp.experts.1.gate_proj", "model.layers.10.mlp.experts.2.gate_proj", "model.layers.10.mlp.experts.3.gate_proj", "model.layers.10.mlp.experts.4.gate_proj", "model.layers.10.mlp.experts.5.gate_proj", "model.layers.10.mlp.experts.6.gate_proj", "model.layers.10.mlp.experts.7.gate_proj", "model.layers.10.mlp.experts.8.gate_proj", "model.layers.10.mlp.experts.9.gate_proj", "model.layers.10.mlp.experts.10.gate_proj", "model.layers.10.mlp.experts.11.gate_proj", "model.layers.10.mlp.experts.12.gate_proj", "model.layers.10.mlp.experts.13.gate_proj", "model.layers.10.mlp.experts.14.gate_proj", "model.layers.10.mlp.experts.15.gate_proj", "model.layers.10.mlp.experts.16.gate_proj", "model.layers.10.mlp.experts.17.gate_proj", "model.layers.10.mlp.experts.18.gate_proj", "model.layers.10.mlp.experts.19.gate_proj", "model.layers.10.mlp.experts.20.gate_proj", "model.layers.10.mlp.experts.21.gate_proj", "model.layers.10.mlp.experts.22.gate_proj", "model.layers.10.mlp.experts.23.gate_proj", "model.layers.10.mlp.experts.24.gate_proj", "model.layers.10.mlp.experts.25.gate_proj", "model.layers.10.mlp.experts.26.gate_proj", "model.layers.10.mlp.experts.27.gate_proj", "model.layers.10.mlp.experts.28.gate_proj", "model.layers.10.mlp.experts.29.gate_proj", "model.layers.10.mlp.experts.30.gate_proj", "model.layers.10.mlp.experts.31.gate_proj", "model.layers.10.mlp.experts.32.gate_proj", "model.layers.10.mlp.experts.33.gate_proj", "model.layers.10.mlp.experts.34.gate_proj", "model.layers.10.mlp.experts.35.gate_proj", "model.layers.10.mlp.experts.36.gate_proj", "model.layers.10.mlp.experts.37.gate_proj", "model.layers.10.mlp.experts.38.gate_proj", "model.layers.10.mlp.experts.39.gate_proj", "model.layers.10.mlp.experts.40.gate_proj", "model.layers.10.mlp.experts.41.gate_proj", "model.layers.10.mlp.experts.42.gate_proj", "model.layers.10.mlp.experts.43.gate_proj", "model.layers.10.mlp.experts.44.gate_proj", "model.layers.10.mlp.experts.45.gate_proj", "model.layers.10.mlp.experts.46.gate_proj", "model.layers.10.mlp.experts.47.gate_proj", "model.layers.10.mlp.experts.48.gate_proj", "model.layers.10.mlp.experts.49.gate_proj", "model.layers.10.mlp.experts.50.gate_proj", "model.layers.10.mlp.experts.51.gate_proj", "model.layers.10.mlp.experts.52.gate_proj", "model.layers.10.mlp.experts.53.gate_proj", "model.layers.10.mlp.experts.54.gate_proj", "model.layers.10.mlp.experts.55.gate_proj", "model.layers.10.mlp.experts.56.gate_proj", "model.layers.10.mlp.experts.57.gate_proj", "model.layers.10.mlp.experts.58.gate_proj", "model.layers.10.mlp.experts.59.gate_proj", "model.layers.10.mlp.experts.60.gate_proj", "model.layers.10.mlp.experts.61.gate_proj", "model.layers.10.mlp.experts.62.gate_proj", "model.layers.10.mlp.experts.63.gate_proj", "model.layers.10.mlp.experts.64.gate_proj", "model.layers.10.mlp.experts.65.gate_proj", "model.layers.10.mlp.experts.66.gate_proj", "model.layers.10.mlp.experts.67.gate_proj", "model.layers.10.mlp.experts.68.gate_proj", "model.layers.10.mlp.experts.69.gate_proj", "model.layers.10.mlp.experts.70.gate_proj", "model.layers.10.mlp.experts.71.gate_proj", "model.layers.10.mlp.experts.72.gate_proj", "model.layers.10.mlp.experts.73.gate_proj", "model.layers.10.mlp.experts.74.gate_proj", "model.layers.10.mlp.experts.75.gate_proj", "model.layers.10.mlp.experts.76.gate_proj", "model.layers.10.mlp.experts.77.gate_proj", "model.layers.10.mlp.experts.78.gate_proj", "model.layers.10.mlp.experts.79.gate_proj", "model.layers.10.mlp.experts.80.gate_proj", "model.layers.10.mlp.experts.81.gate_proj", "model.layers.10.mlp.experts.82.gate_proj", "model.layers.10.mlp.experts.83.gate_proj", "model.layers.10.mlp.experts.84.gate_proj", "model.layers.10.mlp.experts.85.gate_proj", "model.layers.10.mlp.experts.86.gate_proj", "model.layers.10.mlp.experts.87.gate_proj", "model.layers.10.mlp.experts.88.gate_proj", "model.layers.10.mlp.experts.89.gate_proj", "model.layers.10.mlp.experts.90.gate_proj", "model.layers.10.mlp.experts.91.gate_proj", "model.layers.10.mlp.experts.92.gate_proj", "model.layers.10.mlp.experts.93.gate_proj", "model.layers.10.mlp.experts.94.gate_proj", "model.layers.10.mlp.experts.95.gate_proj", "model.layers.10.mlp.experts.96.gate_proj", "model.layers.10.mlp.experts.97.gate_proj", "model.layers.10.mlp.experts.98.gate_proj", "model.layers.10.mlp.experts.99.gate_proj", "model.layers.10.mlp.experts.100.gate_proj", "model.layers.10.mlp.experts.101.gate_proj", "model.layers.10.mlp.experts.102.gate_proj", "model.layers.10.mlp.experts.103.gate_proj", "model.layers.10.mlp.experts.104.gate_proj", "model.layers.10.mlp.experts.105.gate_proj", "model.layers.10.mlp.experts.106.gate_proj", "model.layers.10.mlp.experts.107.gate_proj", "model.layers.10.mlp.experts.108.gate_proj", "model.layers.10.mlp.experts.109.gate_proj", "model.layers.10.mlp.experts.110.gate_proj", "model.layers.10.mlp.experts.111.gate_proj", "model.layers.10.mlp.experts.112.gate_proj", "model.layers.10.mlp.experts.113.gate_proj", "model.layers.10.mlp.experts.114.gate_proj", "model.layers.10.mlp.experts.115.gate_proj", "model.layers.10.mlp.experts.116.gate_proj", "model.layers.10.mlp.experts.117.gate_proj", "model.layers.10.mlp.experts.118.gate_proj", "model.layers.10.mlp.experts.119.gate_proj", "model.layers.10.mlp.experts.120.gate_proj", "model.layers.10.mlp.experts.121.gate_proj", "model.layers.10.mlp.experts.122.gate_proj", "model.layers.10.mlp.experts.123.gate_proj", "model.layers.10.mlp.experts.124.gate_proj", "model.layers.10.mlp.experts.125.gate_proj", "model.layers.10.mlp.experts.126.gate_proj", "model.layers.10.mlp.experts.127.gate_proj", "model.layers.10.mlp.experts.128.gate_proj", "model.layers.10.mlp.experts.129.gate_proj", "model.layers.10.mlp.experts.130.gate_proj", "model.layers.10.mlp.experts.131.gate_proj", "model.layers.10.mlp.experts.132.gate_proj", "model.layers.10.mlp.experts.133.gate_proj", "model.layers.10.mlp.experts.134.gate_proj", "model.layers.10.mlp.experts.135.gate_proj", "model.layers.10.mlp.experts.136.gate_proj", "model.layers.10.mlp.experts.137.gate_proj", "model.layers.10.mlp.experts.138.gate_proj", "model.layers.10.mlp.experts.139.gate_proj", "model.layers.10.mlp.experts.140.gate_proj", "model.layers.10.mlp.experts.141.gate_proj", "model.layers.10.mlp.experts.142.gate_proj", "model.layers.10.mlp.experts.143.gate_proj", "model.layers.10.mlp.experts.144.gate_proj", "model.layers.10.mlp.experts.145.gate_proj", "model.layers.10.mlp.experts.146.gate_proj", "model.layers.10.mlp.experts.147.gate_proj", "model.layers.10.mlp.experts.148.gate_proj", "model.layers.10.mlp.experts.149.gate_proj", "model.layers.10.mlp.experts.150.gate_proj", "model.layers.10.mlp.experts.151.gate_proj", "model.layers.10.mlp.experts.152.gate_proj", "model.layers.10.mlp.experts.153.gate_proj", "model.layers.10.mlp.experts.154.gate_proj", "model.layers.10.mlp.experts.155.gate_proj", "model.layers.10.mlp.experts.156.gate_proj", "model.layers.10.mlp.experts.157.gate_proj", "model.layers.10.mlp.experts.158.gate_proj", "model.layers.10.mlp.experts.159.gate_proj", "model.layers.10.mlp.experts.0.up_proj", "model.layers.10.mlp.experts.1.up_proj", "model.layers.10.mlp.experts.2.up_proj", "model.layers.10.mlp.experts.3.up_proj", "model.layers.10.mlp.experts.4.up_proj", "model.layers.10.mlp.experts.5.up_proj", "model.layers.10.mlp.experts.6.up_proj", "model.layers.10.mlp.experts.7.up_proj", "model.layers.10.mlp.experts.8.up_proj", "model.layers.10.mlp.experts.9.up_proj", "model.layers.10.mlp.experts.10.up_proj", "model.layers.10.mlp.experts.11.up_proj", "model.layers.10.mlp.experts.12.up_proj", "model.layers.10.mlp.experts.13.up_proj", "model.layers.10.mlp.experts.14.up_proj", "model.layers.10.mlp.experts.15.up_proj", "model.layers.10.mlp.experts.16.up_proj", "model.layers.10.mlp.experts.17.up_proj", "model.layers.10.mlp.experts.18.up_proj", "model.layers.10.mlp.experts.19.up_proj", "model.layers.10.mlp.experts.20.up_proj", "model.layers.10.mlp.experts.21.up_proj", "model.layers.10.mlp.experts.22.up_proj", "model.layers.10.mlp.experts.23.up_proj", "model.layers.10.mlp.experts.24.up_proj", "model.layers.10.mlp.experts.25.up_proj", "model.layers.10.mlp.experts.26.up_proj", "model.layers.10.mlp.experts.27.up_proj", "model.layers.10.mlp.experts.28.up_proj", "model.layers.10.mlp.experts.29.up_proj", "model.layers.10.mlp.experts.30.up_proj", "model.layers.10.mlp.experts.31.up_proj", "model.layers.10.mlp.experts.32.up_proj", "model.layers.10.mlp.experts.33.up_proj", "model.layers.10.mlp.experts.34.up_proj", "model.layers.10.mlp.experts.35.up_proj", "model.layers.10.mlp.experts.36.up_proj", "model.layers.10.mlp.experts.37.up_proj", "model.layers.10.mlp.experts.38.up_proj", "model.layers.10.mlp.experts.39.up_proj", "model.layers.10.mlp.experts.40.up_proj", "model.layers.10.mlp.experts.41.up_proj", "model.layers.10.mlp.experts.42.up_proj", "model.layers.10.mlp.experts.43.up_proj", "model.layers.10.mlp.experts.44.up_proj", "model.layers.10.mlp.experts.45.up_proj", "model.layers.10.mlp.experts.46.up_proj", "model.layers.10.mlp.experts.47.up_proj", "model.layers.10.mlp.experts.48.up_proj", "model.layers.10.mlp.experts.49.up_proj", "model.layers.10.mlp.experts.50.up_proj", "model.layers.10.mlp.experts.51.up_proj", "model.layers.10.mlp.experts.52.up_proj", "model.layers.10.mlp.experts.53.up_proj", "model.layers.10.mlp.experts.54.up_proj", "model.layers.10.mlp.experts.55.up_proj", "model.layers.10.mlp.experts.56.up_proj", "model.layers.10.mlp.experts.57.up_proj", "model.layers.10.mlp.experts.58.up_proj", "model.layers.10.mlp.experts.59.up_proj", "model.layers.10.mlp.experts.60.up_proj", "model.layers.10.mlp.experts.61.up_proj", "model.layers.10.mlp.experts.62.up_proj", "model.layers.10.mlp.experts.63.up_proj", "model.layers.10.mlp.experts.64.up_proj", "model.layers.10.mlp.experts.65.up_proj", "model.layers.10.mlp.experts.66.up_proj", "model.layers.10.mlp.experts.67.up_proj", "model.layers.10.mlp.experts.68.up_proj", "model.layers.10.mlp.experts.69.up_proj", "model.layers.10.mlp.experts.70.up_proj", "model.layers.10.mlp.experts.71.up_proj", "model.layers.10.mlp.experts.72.up_proj", "model.layers.10.mlp.experts.73.up_proj", "model.layers.10.mlp.experts.74.up_proj", "model.layers.10.mlp.experts.75.up_proj", "model.layers.10.mlp.experts.76.up_proj", "model.layers.10.mlp.experts.77.up_proj", "model.layers.10.mlp.experts.78.up_proj", "model.layers.10.mlp.experts.79.up_proj", "model.layers.10.mlp.experts.80.up_proj", "model.layers.10.mlp.experts.81.up_proj", "model.layers.10.mlp.experts.82.up_proj", "model.layers.10.mlp.experts.83.up_proj", "model.layers.10.mlp.experts.84.up_proj", "model.layers.10.mlp.experts.85.up_proj", "model.layers.10.mlp.experts.86.up_proj", "model.layers.10.mlp.experts.87.up_proj", "model.layers.10.mlp.experts.88.up_proj", "model.layers.10.mlp.experts.89.up_proj", "model.layers.10.mlp.experts.90.up_proj", "model.layers.10.mlp.experts.91.up_proj", "model.layers.10.mlp.experts.92.up_proj", "model.layers.10.mlp.experts.93.up_proj", "model.layers.10.mlp.experts.94.up_proj", "model.layers.10.mlp.experts.95.up_proj", "model.layers.10.mlp.experts.96.up_proj", "model.layers.10.mlp.experts.97.up_proj", "model.layers.10.mlp.experts.98.up_proj", "model.layers.10.mlp.experts.99.up_proj", "model.layers.10.mlp.experts.100.up_proj", "model.layers.10.mlp.experts.101.up_proj", "model.layers.10.mlp.experts.102.up_proj", "model.layers.10.mlp.experts.103.up_proj", "model.layers.10.mlp.experts.104.up_proj", "model.layers.10.mlp.experts.105.up_proj", "model.layers.10.mlp.experts.106.up_proj", "model.layers.10.mlp.experts.107.up_proj", "model.layers.10.mlp.experts.108.up_proj", "model.layers.10.mlp.experts.109.up_proj", "model.layers.10.mlp.experts.110.up_proj", "model.layers.10.mlp.experts.111.up_proj", "model.layers.10.mlp.experts.112.up_proj", "model.layers.10.mlp.experts.113.up_proj", "model.layers.10.mlp.experts.114.up_proj", "model.layers.10.mlp.experts.115.up_proj", "model.layers.10.mlp.experts.116.up_proj", "model.layers.10.mlp.experts.117.up_proj", "model.layers.10.mlp.experts.118.up_proj", "model.layers.10.mlp.experts.119.up_proj", "model.layers.10.mlp.experts.120.up_proj", "model.layers.10.mlp.experts.121.up_proj", "model.layers.10.mlp.experts.122.up_proj", "model.layers.10.mlp.experts.123.up_proj", "model.layers.10.mlp.experts.124.up_proj", "model.layers.10.mlp.experts.125.up_proj", "model.layers.10.mlp.experts.126.up_proj", "model.layers.10.mlp.experts.127.up_proj", "model.layers.10.mlp.experts.128.up_proj", "model.layers.10.mlp.experts.129.up_proj", "model.layers.10.mlp.experts.130.up_proj", "model.layers.10.mlp.experts.131.up_proj", "model.layers.10.mlp.experts.132.up_proj", "model.layers.10.mlp.experts.133.up_proj", "model.layers.10.mlp.experts.134.up_proj", "model.layers.10.mlp.experts.135.up_proj", "model.layers.10.mlp.experts.136.up_proj", "model.layers.10.mlp.experts.137.up_proj", "model.layers.10.mlp.experts.138.up_proj", "model.layers.10.mlp.experts.139.up_proj", "model.layers.10.mlp.experts.140.up_proj", "model.layers.10.mlp.experts.141.up_proj", "model.layers.10.mlp.experts.142.up_proj", "model.layers.10.mlp.experts.143.up_proj", "model.layers.10.mlp.experts.144.up_proj", "model.layers.10.mlp.experts.145.up_proj", "model.layers.10.mlp.experts.146.up_proj", "model.layers.10.mlp.experts.147.up_proj", "model.layers.10.mlp.experts.148.up_proj", "model.layers.10.mlp.experts.149.up_proj", "model.layers.10.mlp.experts.150.up_proj", "model.layers.10.mlp.experts.151.up_proj", "model.layers.10.mlp.experts.152.up_proj", "model.layers.10.mlp.experts.153.up_proj", "model.layers.10.mlp.experts.154.up_proj", "model.layers.10.mlp.experts.155.up_proj", "model.layers.10.mlp.experts.156.up_proj", "model.layers.10.mlp.experts.157.up_proj", "model.layers.10.mlp.experts.158.up_proj", "model.layers.10.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.8227724619209766e-05, "dbits": 2516582400 }, { "dkld": -9.180167689919368e-05, "dbits": 5033164800 } ] }, { "idx": 62, "layers": [ "model.layers.10.mlp.experts.0.down_proj", "model.layers.10.mlp.experts.1.down_proj", "model.layers.10.mlp.experts.2.down_proj", "model.layers.10.mlp.experts.3.down_proj", "model.layers.10.mlp.experts.4.down_proj", "model.layers.10.mlp.experts.5.down_proj", "model.layers.10.mlp.experts.6.down_proj", "model.layers.10.mlp.experts.7.down_proj", "model.layers.10.mlp.experts.8.down_proj", "model.layers.10.mlp.experts.9.down_proj", "model.layers.10.mlp.experts.10.down_proj", "model.layers.10.mlp.experts.11.down_proj", "model.layers.10.mlp.experts.12.down_proj", "model.layers.10.mlp.experts.13.down_proj", "model.layers.10.mlp.experts.14.down_proj", "model.layers.10.mlp.experts.15.down_proj", "model.layers.10.mlp.experts.16.down_proj", "model.layers.10.mlp.experts.17.down_proj", "model.layers.10.mlp.experts.18.down_proj", "model.layers.10.mlp.experts.19.down_proj", "model.layers.10.mlp.experts.20.down_proj", "model.layers.10.mlp.experts.21.down_proj", "model.layers.10.mlp.experts.22.down_proj", "model.layers.10.mlp.experts.23.down_proj", "model.layers.10.mlp.experts.24.down_proj", "model.layers.10.mlp.experts.25.down_proj", "model.layers.10.mlp.experts.26.down_proj", "model.layers.10.mlp.experts.27.down_proj", "model.layers.10.mlp.experts.28.down_proj", "model.layers.10.mlp.experts.29.down_proj", "model.layers.10.mlp.experts.30.down_proj", "model.layers.10.mlp.experts.31.down_proj", "model.layers.10.mlp.experts.32.down_proj", "model.layers.10.mlp.experts.33.down_proj", "model.layers.10.mlp.experts.34.down_proj", "model.layers.10.mlp.experts.35.down_proj", "model.layers.10.mlp.experts.36.down_proj", "model.layers.10.mlp.experts.37.down_proj", "model.layers.10.mlp.experts.38.down_proj", "model.layers.10.mlp.experts.39.down_proj", "model.layers.10.mlp.experts.40.down_proj", "model.layers.10.mlp.experts.41.down_proj", "model.layers.10.mlp.experts.42.down_proj", "model.layers.10.mlp.experts.43.down_proj", "model.layers.10.mlp.experts.44.down_proj", "model.layers.10.mlp.experts.45.down_proj", "model.layers.10.mlp.experts.46.down_proj", "model.layers.10.mlp.experts.47.down_proj", "model.layers.10.mlp.experts.48.down_proj", "model.layers.10.mlp.experts.49.down_proj", "model.layers.10.mlp.experts.50.down_proj", "model.layers.10.mlp.experts.51.down_proj", "model.layers.10.mlp.experts.52.down_proj", "model.layers.10.mlp.experts.53.down_proj", "model.layers.10.mlp.experts.54.down_proj", "model.layers.10.mlp.experts.55.down_proj", "model.layers.10.mlp.experts.56.down_proj", "model.layers.10.mlp.experts.57.down_proj", "model.layers.10.mlp.experts.58.down_proj", "model.layers.10.mlp.experts.59.down_proj", "model.layers.10.mlp.experts.60.down_proj", "model.layers.10.mlp.experts.61.down_proj", "model.layers.10.mlp.experts.62.down_proj", "model.layers.10.mlp.experts.63.down_proj", "model.layers.10.mlp.experts.64.down_proj", "model.layers.10.mlp.experts.65.down_proj", "model.layers.10.mlp.experts.66.down_proj", "model.layers.10.mlp.experts.67.down_proj", "model.layers.10.mlp.experts.68.down_proj", "model.layers.10.mlp.experts.69.down_proj", "model.layers.10.mlp.experts.70.down_proj", "model.layers.10.mlp.experts.71.down_proj", "model.layers.10.mlp.experts.72.down_proj", "model.layers.10.mlp.experts.73.down_proj", "model.layers.10.mlp.experts.74.down_proj", "model.layers.10.mlp.experts.75.down_proj", "model.layers.10.mlp.experts.76.down_proj", "model.layers.10.mlp.experts.77.down_proj", "model.layers.10.mlp.experts.78.down_proj", "model.layers.10.mlp.experts.79.down_proj", "model.layers.10.mlp.experts.80.down_proj", "model.layers.10.mlp.experts.81.down_proj", "model.layers.10.mlp.experts.82.down_proj", "model.layers.10.mlp.experts.83.down_proj", "model.layers.10.mlp.experts.84.down_proj", "model.layers.10.mlp.experts.85.down_proj", "model.layers.10.mlp.experts.86.down_proj", "model.layers.10.mlp.experts.87.down_proj", "model.layers.10.mlp.experts.88.down_proj", "model.layers.10.mlp.experts.89.down_proj", "model.layers.10.mlp.experts.90.down_proj", "model.layers.10.mlp.experts.91.down_proj", "model.layers.10.mlp.experts.92.down_proj", "model.layers.10.mlp.experts.93.down_proj", "model.layers.10.mlp.experts.94.down_proj", "model.layers.10.mlp.experts.95.down_proj", "model.layers.10.mlp.experts.96.down_proj", "model.layers.10.mlp.experts.97.down_proj", "model.layers.10.mlp.experts.98.down_proj", "model.layers.10.mlp.experts.99.down_proj", "model.layers.10.mlp.experts.100.down_proj", "model.layers.10.mlp.experts.101.down_proj", "model.layers.10.mlp.experts.102.down_proj", "model.layers.10.mlp.experts.103.down_proj", "model.layers.10.mlp.experts.104.down_proj", "model.layers.10.mlp.experts.105.down_proj", "model.layers.10.mlp.experts.106.down_proj", "model.layers.10.mlp.experts.107.down_proj", "model.layers.10.mlp.experts.108.down_proj", "model.layers.10.mlp.experts.109.down_proj", "model.layers.10.mlp.experts.110.down_proj", "model.layers.10.mlp.experts.111.down_proj", "model.layers.10.mlp.experts.112.down_proj", "model.layers.10.mlp.experts.113.down_proj", "model.layers.10.mlp.experts.114.down_proj", "model.layers.10.mlp.experts.115.down_proj", "model.layers.10.mlp.experts.116.down_proj", "model.layers.10.mlp.experts.117.down_proj", "model.layers.10.mlp.experts.118.down_proj", "model.layers.10.mlp.experts.119.down_proj", "model.layers.10.mlp.experts.120.down_proj", "model.layers.10.mlp.experts.121.down_proj", "model.layers.10.mlp.experts.122.down_proj", "model.layers.10.mlp.experts.123.down_proj", "model.layers.10.mlp.experts.124.down_proj", "model.layers.10.mlp.experts.125.down_proj", "model.layers.10.mlp.experts.126.down_proj", "model.layers.10.mlp.experts.127.down_proj", "model.layers.10.mlp.experts.128.down_proj", "model.layers.10.mlp.experts.129.down_proj", "model.layers.10.mlp.experts.130.down_proj", "model.layers.10.mlp.experts.131.down_proj", "model.layers.10.mlp.experts.132.down_proj", "model.layers.10.mlp.experts.133.down_proj", "model.layers.10.mlp.experts.134.down_proj", "model.layers.10.mlp.experts.135.down_proj", "model.layers.10.mlp.experts.136.down_proj", "model.layers.10.mlp.experts.137.down_proj", "model.layers.10.mlp.experts.138.down_proj", "model.layers.10.mlp.experts.139.down_proj", "model.layers.10.mlp.experts.140.down_proj", "model.layers.10.mlp.experts.141.down_proj", "model.layers.10.mlp.experts.142.down_proj", "model.layers.10.mlp.experts.143.down_proj", "model.layers.10.mlp.experts.144.down_proj", "model.layers.10.mlp.experts.145.down_proj", "model.layers.10.mlp.experts.146.down_proj", "model.layers.10.mlp.experts.147.down_proj", "model.layers.10.mlp.experts.148.down_proj", "model.layers.10.mlp.experts.149.down_proj", "model.layers.10.mlp.experts.150.down_proj", "model.layers.10.mlp.experts.151.down_proj", "model.layers.10.mlp.experts.152.down_proj", "model.layers.10.mlp.experts.153.down_proj", "model.layers.10.mlp.experts.154.down_proj", "model.layers.10.mlp.experts.155.down_proj", "model.layers.10.mlp.experts.156.down_proj", "model.layers.10.mlp.experts.157.down_proj", "model.layers.10.mlp.experts.158.down_proj", "model.layers.10.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.782089963555232e-05, "dbits": 1258291200 }, { "dkld": -6.608208641409839e-05, "dbits": 2516582400 } ] }, { "idx": 63, "layers": [ "model.layers.11.self_attn.q_proj" ], "candidates": [ { "dkld": -8.321211207657983e-05, "dbits": 62914560 }, { "dkld": -2.5393441319465637e-05, "dbits": 125829120 } ] }, { "idx": 64, "layers": [ "model.layers.11.self_attn.k_proj", "model.layers.11.self_attn.v_proj" ], "candidates": [ { "dkld": 8.112571667879924e-05, "dbits": 10485760 }, { "dkld": 7.938868366181955e-05, "dbits": 20971520 } ] }, { "idx": 65, "layers": [ "model.layers.11.self_attn.o_proj" ], "candidates": [ { "dkld": -0.0003075837390497313, "dbits": 62914560 }, { "dkld": -0.00031663747504353384, "dbits": 125829120 } ] }, { "idx": 66, "layers": [ "model.layers.11.mlp.shared_experts.gate_proj", "model.layers.11.mlp.shared_experts.up_proj", "model.layers.11.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.193924833089009e-05, "dbits": 23592960 }, { "dkld": 3.067892976105213e-06, "dbits": 47185920 } ] }, { "idx": 67, "layers": [ "model.layers.11.mlp.experts.0.gate_proj", "model.layers.11.mlp.experts.1.gate_proj", "model.layers.11.mlp.experts.2.gate_proj", "model.layers.11.mlp.experts.3.gate_proj", "model.layers.11.mlp.experts.4.gate_proj", "model.layers.11.mlp.experts.5.gate_proj", "model.layers.11.mlp.experts.6.gate_proj", "model.layers.11.mlp.experts.7.gate_proj", "model.layers.11.mlp.experts.8.gate_proj", "model.layers.11.mlp.experts.9.gate_proj", "model.layers.11.mlp.experts.10.gate_proj", "model.layers.11.mlp.experts.11.gate_proj", "model.layers.11.mlp.experts.12.gate_proj", "model.layers.11.mlp.experts.13.gate_proj", "model.layers.11.mlp.experts.14.gate_proj", "model.layers.11.mlp.experts.15.gate_proj", "model.layers.11.mlp.experts.16.gate_proj", "model.layers.11.mlp.experts.17.gate_proj", "model.layers.11.mlp.experts.18.gate_proj", "model.layers.11.mlp.experts.19.gate_proj", "model.layers.11.mlp.experts.20.gate_proj", "model.layers.11.mlp.experts.21.gate_proj", "model.layers.11.mlp.experts.22.gate_proj", "model.layers.11.mlp.experts.23.gate_proj", "model.layers.11.mlp.experts.24.gate_proj", "model.layers.11.mlp.experts.25.gate_proj", "model.layers.11.mlp.experts.26.gate_proj", "model.layers.11.mlp.experts.27.gate_proj", "model.layers.11.mlp.experts.28.gate_proj", "model.layers.11.mlp.experts.29.gate_proj", "model.layers.11.mlp.experts.30.gate_proj", "model.layers.11.mlp.experts.31.gate_proj", "model.layers.11.mlp.experts.32.gate_proj", "model.layers.11.mlp.experts.33.gate_proj", "model.layers.11.mlp.experts.34.gate_proj", "model.layers.11.mlp.experts.35.gate_proj", "model.layers.11.mlp.experts.36.gate_proj", "model.layers.11.mlp.experts.37.gate_proj", "model.layers.11.mlp.experts.38.gate_proj", "model.layers.11.mlp.experts.39.gate_proj", "model.layers.11.mlp.experts.40.gate_proj", "model.layers.11.mlp.experts.41.gate_proj", "model.layers.11.mlp.experts.42.gate_proj", "model.layers.11.mlp.experts.43.gate_proj", "model.layers.11.mlp.experts.44.gate_proj", "model.layers.11.mlp.experts.45.gate_proj", "model.layers.11.mlp.experts.46.gate_proj", "model.layers.11.mlp.experts.47.gate_proj", "model.layers.11.mlp.experts.48.gate_proj", "model.layers.11.mlp.experts.49.gate_proj", "model.layers.11.mlp.experts.50.gate_proj", "model.layers.11.mlp.experts.51.gate_proj", "model.layers.11.mlp.experts.52.gate_proj", "model.layers.11.mlp.experts.53.gate_proj", "model.layers.11.mlp.experts.54.gate_proj", "model.layers.11.mlp.experts.55.gate_proj", "model.layers.11.mlp.experts.56.gate_proj", "model.layers.11.mlp.experts.57.gate_proj", "model.layers.11.mlp.experts.58.gate_proj", "model.layers.11.mlp.experts.59.gate_proj", "model.layers.11.mlp.experts.60.gate_proj", "model.layers.11.mlp.experts.61.gate_proj", "model.layers.11.mlp.experts.62.gate_proj", "model.layers.11.mlp.experts.63.gate_proj", "model.layers.11.mlp.experts.64.gate_proj", "model.layers.11.mlp.experts.65.gate_proj", "model.layers.11.mlp.experts.66.gate_proj", "model.layers.11.mlp.experts.67.gate_proj", "model.layers.11.mlp.experts.68.gate_proj", "model.layers.11.mlp.experts.69.gate_proj", "model.layers.11.mlp.experts.70.gate_proj", "model.layers.11.mlp.experts.71.gate_proj", "model.layers.11.mlp.experts.72.gate_proj", "model.layers.11.mlp.experts.73.gate_proj", "model.layers.11.mlp.experts.74.gate_proj", "model.layers.11.mlp.experts.75.gate_proj", "model.layers.11.mlp.experts.76.gate_proj", "model.layers.11.mlp.experts.77.gate_proj", "model.layers.11.mlp.experts.78.gate_proj", "model.layers.11.mlp.experts.79.gate_proj", "model.layers.11.mlp.experts.80.gate_proj", "model.layers.11.mlp.experts.81.gate_proj", "model.layers.11.mlp.experts.82.gate_proj", "model.layers.11.mlp.experts.83.gate_proj", "model.layers.11.mlp.experts.84.gate_proj", "model.layers.11.mlp.experts.85.gate_proj", "model.layers.11.mlp.experts.86.gate_proj", "model.layers.11.mlp.experts.87.gate_proj", "model.layers.11.mlp.experts.88.gate_proj", "model.layers.11.mlp.experts.89.gate_proj", "model.layers.11.mlp.experts.90.gate_proj", "model.layers.11.mlp.experts.91.gate_proj", "model.layers.11.mlp.experts.92.gate_proj", "model.layers.11.mlp.experts.93.gate_proj", "model.layers.11.mlp.experts.94.gate_proj", "model.layers.11.mlp.experts.95.gate_proj", "model.layers.11.mlp.experts.96.gate_proj", "model.layers.11.mlp.experts.97.gate_proj", "model.layers.11.mlp.experts.98.gate_proj", "model.layers.11.mlp.experts.99.gate_proj", "model.layers.11.mlp.experts.100.gate_proj", "model.layers.11.mlp.experts.101.gate_proj", "model.layers.11.mlp.experts.102.gate_proj", "model.layers.11.mlp.experts.103.gate_proj", "model.layers.11.mlp.experts.104.gate_proj", "model.layers.11.mlp.experts.105.gate_proj", "model.layers.11.mlp.experts.106.gate_proj", "model.layers.11.mlp.experts.107.gate_proj", "model.layers.11.mlp.experts.108.gate_proj", "model.layers.11.mlp.experts.109.gate_proj", "model.layers.11.mlp.experts.110.gate_proj", "model.layers.11.mlp.experts.111.gate_proj", "model.layers.11.mlp.experts.112.gate_proj", "model.layers.11.mlp.experts.113.gate_proj", "model.layers.11.mlp.experts.114.gate_proj", "model.layers.11.mlp.experts.115.gate_proj", "model.layers.11.mlp.experts.116.gate_proj", "model.layers.11.mlp.experts.117.gate_proj", "model.layers.11.mlp.experts.118.gate_proj", "model.layers.11.mlp.experts.119.gate_proj", "model.layers.11.mlp.experts.120.gate_proj", "model.layers.11.mlp.experts.121.gate_proj", "model.layers.11.mlp.experts.122.gate_proj", "model.layers.11.mlp.experts.123.gate_proj", "model.layers.11.mlp.experts.124.gate_proj", "model.layers.11.mlp.experts.125.gate_proj", "model.layers.11.mlp.experts.126.gate_proj", "model.layers.11.mlp.experts.127.gate_proj", "model.layers.11.mlp.experts.128.gate_proj", "model.layers.11.mlp.experts.129.gate_proj", "model.layers.11.mlp.experts.130.gate_proj", "model.layers.11.mlp.experts.131.gate_proj", "model.layers.11.mlp.experts.132.gate_proj", "model.layers.11.mlp.experts.133.gate_proj", "model.layers.11.mlp.experts.134.gate_proj", "model.layers.11.mlp.experts.135.gate_proj", "model.layers.11.mlp.experts.136.gate_proj", "model.layers.11.mlp.experts.137.gate_proj", "model.layers.11.mlp.experts.138.gate_proj", "model.layers.11.mlp.experts.139.gate_proj", "model.layers.11.mlp.experts.140.gate_proj", "model.layers.11.mlp.experts.141.gate_proj", "model.layers.11.mlp.experts.142.gate_proj", "model.layers.11.mlp.experts.143.gate_proj", "model.layers.11.mlp.experts.144.gate_proj", "model.layers.11.mlp.experts.145.gate_proj", "model.layers.11.mlp.experts.146.gate_proj", "model.layers.11.mlp.experts.147.gate_proj", "model.layers.11.mlp.experts.148.gate_proj", "model.layers.11.mlp.experts.149.gate_proj", "model.layers.11.mlp.experts.150.gate_proj", "model.layers.11.mlp.experts.151.gate_proj", "model.layers.11.mlp.experts.152.gate_proj", "model.layers.11.mlp.experts.153.gate_proj", "model.layers.11.mlp.experts.154.gate_proj", "model.layers.11.mlp.experts.155.gate_proj", "model.layers.11.mlp.experts.156.gate_proj", "model.layers.11.mlp.experts.157.gate_proj", "model.layers.11.mlp.experts.158.gate_proj", "model.layers.11.mlp.experts.159.gate_proj", "model.layers.11.mlp.experts.0.up_proj", "model.layers.11.mlp.experts.1.up_proj", "model.layers.11.mlp.experts.2.up_proj", "model.layers.11.mlp.experts.3.up_proj", "model.layers.11.mlp.experts.4.up_proj", "model.layers.11.mlp.experts.5.up_proj", "model.layers.11.mlp.experts.6.up_proj", "model.layers.11.mlp.experts.7.up_proj", "model.layers.11.mlp.experts.8.up_proj", "model.layers.11.mlp.experts.9.up_proj", "model.layers.11.mlp.experts.10.up_proj", "model.layers.11.mlp.experts.11.up_proj", "model.layers.11.mlp.experts.12.up_proj", "model.layers.11.mlp.experts.13.up_proj", "model.layers.11.mlp.experts.14.up_proj", "model.layers.11.mlp.experts.15.up_proj", "model.layers.11.mlp.experts.16.up_proj", "model.layers.11.mlp.experts.17.up_proj", "model.layers.11.mlp.experts.18.up_proj", "model.layers.11.mlp.experts.19.up_proj", "model.layers.11.mlp.experts.20.up_proj", "model.layers.11.mlp.experts.21.up_proj", "model.layers.11.mlp.experts.22.up_proj", "model.layers.11.mlp.experts.23.up_proj", "model.layers.11.mlp.experts.24.up_proj", "model.layers.11.mlp.experts.25.up_proj", "model.layers.11.mlp.experts.26.up_proj", "model.layers.11.mlp.experts.27.up_proj", "model.layers.11.mlp.experts.28.up_proj", "model.layers.11.mlp.experts.29.up_proj", "model.layers.11.mlp.experts.30.up_proj", "model.layers.11.mlp.experts.31.up_proj", "model.layers.11.mlp.experts.32.up_proj", "model.layers.11.mlp.experts.33.up_proj", "model.layers.11.mlp.experts.34.up_proj", "model.layers.11.mlp.experts.35.up_proj", "model.layers.11.mlp.experts.36.up_proj", "model.layers.11.mlp.experts.37.up_proj", "model.layers.11.mlp.experts.38.up_proj", "model.layers.11.mlp.experts.39.up_proj", "model.layers.11.mlp.experts.40.up_proj", "model.layers.11.mlp.experts.41.up_proj", "model.layers.11.mlp.experts.42.up_proj", "model.layers.11.mlp.experts.43.up_proj", "model.layers.11.mlp.experts.44.up_proj", "model.layers.11.mlp.experts.45.up_proj", "model.layers.11.mlp.experts.46.up_proj", "model.layers.11.mlp.experts.47.up_proj", "model.layers.11.mlp.experts.48.up_proj", "model.layers.11.mlp.experts.49.up_proj", "model.layers.11.mlp.experts.50.up_proj", "model.layers.11.mlp.experts.51.up_proj", "model.layers.11.mlp.experts.52.up_proj", "model.layers.11.mlp.experts.53.up_proj", "model.layers.11.mlp.experts.54.up_proj", "model.layers.11.mlp.experts.55.up_proj", "model.layers.11.mlp.experts.56.up_proj", "model.layers.11.mlp.experts.57.up_proj", "model.layers.11.mlp.experts.58.up_proj", "model.layers.11.mlp.experts.59.up_proj", "model.layers.11.mlp.experts.60.up_proj", "model.layers.11.mlp.experts.61.up_proj", "model.layers.11.mlp.experts.62.up_proj", "model.layers.11.mlp.experts.63.up_proj", "model.layers.11.mlp.experts.64.up_proj", "model.layers.11.mlp.experts.65.up_proj", "model.layers.11.mlp.experts.66.up_proj", "model.layers.11.mlp.experts.67.up_proj", "model.layers.11.mlp.experts.68.up_proj", "model.layers.11.mlp.experts.69.up_proj", "model.layers.11.mlp.experts.70.up_proj", "model.layers.11.mlp.experts.71.up_proj", "model.layers.11.mlp.experts.72.up_proj", "model.layers.11.mlp.experts.73.up_proj", "model.layers.11.mlp.experts.74.up_proj", "model.layers.11.mlp.experts.75.up_proj", "model.layers.11.mlp.experts.76.up_proj", "model.layers.11.mlp.experts.77.up_proj", "model.layers.11.mlp.experts.78.up_proj", "model.layers.11.mlp.experts.79.up_proj", "model.layers.11.mlp.experts.80.up_proj", "model.layers.11.mlp.experts.81.up_proj", "model.layers.11.mlp.experts.82.up_proj", "model.layers.11.mlp.experts.83.up_proj", "model.layers.11.mlp.experts.84.up_proj", "model.layers.11.mlp.experts.85.up_proj", "model.layers.11.mlp.experts.86.up_proj", "model.layers.11.mlp.experts.87.up_proj", "model.layers.11.mlp.experts.88.up_proj", "model.layers.11.mlp.experts.89.up_proj", "model.layers.11.mlp.experts.90.up_proj", "model.layers.11.mlp.experts.91.up_proj", "model.layers.11.mlp.experts.92.up_proj", "model.layers.11.mlp.experts.93.up_proj", "model.layers.11.mlp.experts.94.up_proj", "model.layers.11.mlp.experts.95.up_proj", "model.layers.11.mlp.experts.96.up_proj", "model.layers.11.mlp.experts.97.up_proj", "model.layers.11.mlp.experts.98.up_proj", "model.layers.11.mlp.experts.99.up_proj", "model.layers.11.mlp.experts.100.up_proj", "model.layers.11.mlp.experts.101.up_proj", "model.layers.11.mlp.experts.102.up_proj", "model.layers.11.mlp.experts.103.up_proj", "model.layers.11.mlp.experts.104.up_proj", "model.layers.11.mlp.experts.105.up_proj", "model.layers.11.mlp.experts.106.up_proj", "model.layers.11.mlp.experts.107.up_proj", "model.layers.11.mlp.experts.108.up_proj", "model.layers.11.mlp.experts.109.up_proj", "model.layers.11.mlp.experts.110.up_proj", "model.layers.11.mlp.experts.111.up_proj", "model.layers.11.mlp.experts.112.up_proj", "model.layers.11.mlp.experts.113.up_proj", "model.layers.11.mlp.experts.114.up_proj", "model.layers.11.mlp.experts.115.up_proj", "model.layers.11.mlp.experts.116.up_proj", "model.layers.11.mlp.experts.117.up_proj", "model.layers.11.mlp.experts.118.up_proj", "model.layers.11.mlp.experts.119.up_proj", "model.layers.11.mlp.experts.120.up_proj", "model.layers.11.mlp.experts.121.up_proj", "model.layers.11.mlp.experts.122.up_proj", "model.layers.11.mlp.experts.123.up_proj", "model.layers.11.mlp.experts.124.up_proj", "model.layers.11.mlp.experts.125.up_proj", "model.layers.11.mlp.experts.126.up_proj", "model.layers.11.mlp.experts.127.up_proj", "model.layers.11.mlp.experts.128.up_proj", "model.layers.11.mlp.experts.129.up_proj", "model.layers.11.mlp.experts.130.up_proj", "model.layers.11.mlp.experts.131.up_proj", "model.layers.11.mlp.experts.132.up_proj", "model.layers.11.mlp.experts.133.up_proj", "model.layers.11.mlp.experts.134.up_proj", "model.layers.11.mlp.experts.135.up_proj", "model.layers.11.mlp.experts.136.up_proj", "model.layers.11.mlp.experts.137.up_proj", "model.layers.11.mlp.experts.138.up_proj", "model.layers.11.mlp.experts.139.up_proj", "model.layers.11.mlp.experts.140.up_proj", "model.layers.11.mlp.experts.141.up_proj", "model.layers.11.mlp.experts.142.up_proj", "model.layers.11.mlp.experts.143.up_proj", "model.layers.11.mlp.experts.144.up_proj", "model.layers.11.mlp.experts.145.up_proj", "model.layers.11.mlp.experts.146.up_proj", "model.layers.11.mlp.experts.147.up_proj", "model.layers.11.mlp.experts.148.up_proj", "model.layers.11.mlp.experts.149.up_proj", "model.layers.11.mlp.experts.150.up_proj", "model.layers.11.mlp.experts.151.up_proj", "model.layers.11.mlp.experts.152.up_proj", "model.layers.11.mlp.experts.153.up_proj", "model.layers.11.mlp.experts.154.up_proj", "model.layers.11.mlp.experts.155.up_proj", "model.layers.11.mlp.experts.156.up_proj", "model.layers.11.mlp.experts.157.up_proj", "model.layers.11.mlp.experts.158.up_proj", "model.layers.11.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -5.919302348047356e-05, "dbits": 2516582400 }, { "dkld": -3.5106949508189114e-05, "dbits": 5033164800 } ] }, { "idx": 68, "layers": [ "model.layers.11.mlp.experts.0.down_proj", "model.layers.11.mlp.experts.1.down_proj", "model.layers.11.mlp.experts.2.down_proj", "model.layers.11.mlp.experts.3.down_proj", "model.layers.11.mlp.experts.4.down_proj", "model.layers.11.mlp.experts.5.down_proj", "model.layers.11.mlp.experts.6.down_proj", "model.layers.11.mlp.experts.7.down_proj", "model.layers.11.mlp.experts.8.down_proj", "model.layers.11.mlp.experts.9.down_proj", "model.layers.11.mlp.experts.10.down_proj", "model.layers.11.mlp.experts.11.down_proj", "model.layers.11.mlp.experts.12.down_proj", "model.layers.11.mlp.experts.13.down_proj", "model.layers.11.mlp.experts.14.down_proj", "model.layers.11.mlp.experts.15.down_proj", "model.layers.11.mlp.experts.16.down_proj", "model.layers.11.mlp.experts.17.down_proj", "model.layers.11.mlp.experts.18.down_proj", "model.layers.11.mlp.experts.19.down_proj", "model.layers.11.mlp.experts.20.down_proj", "model.layers.11.mlp.experts.21.down_proj", "model.layers.11.mlp.experts.22.down_proj", "model.layers.11.mlp.experts.23.down_proj", "model.layers.11.mlp.experts.24.down_proj", "model.layers.11.mlp.experts.25.down_proj", "model.layers.11.mlp.experts.26.down_proj", "model.layers.11.mlp.experts.27.down_proj", "model.layers.11.mlp.experts.28.down_proj", "model.layers.11.mlp.experts.29.down_proj", "model.layers.11.mlp.experts.30.down_proj", "model.layers.11.mlp.experts.31.down_proj", "model.layers.11.mlp.experts.32.down_proj", "model.layers.11.mlp.experts.33.down_proj", "model.layers.11.mlp.experts.34.down_proj", "model.layers.11.mlp.experts.35.down_proj", "model.layers.11.mlp.experts.36.down_proj", "model.layers.11.mlp.experts.37.down_proj", "model.layers.11.mlp.experts.38.down_proj", "model.layers.11.mlp.experts.39.down_proj", "model.layers.11.mlp.experts.40.down_proj", "model.layers.11.mlp.experts.41.down_proj", "model.layers.11.mlp.experts.42.down_proj", "model.layers.11.mlp.experts.43.down_proj", "model.layers.11.mlp.experts.44.down_proj", "model.layers.11.mlp.experts.45.down_proj", "model.layers.11.mlp.experts.46.down_proj", "model.layers.11.mlp.experts.47.down_proj", "model.layers.11.mlp.experts.48.down_proj", "model.layers.11.mlp.experts.49.down_proj", "model.layers.11.mlp.experts.50.down_proj", "model.layers.11.mlp.experts.51.down_proj", "model.layers.11.mlp.experts.52.down_proj", "model.layers.11.mlp.experts.53.down_proj", "model.layers.11.mlp.experts.54.down_proj", "model.layers.11.mlp.experts.55.down_proj", "model.layers.11.mlp.experts.56.down_proj", "model.layers.11.mlp.experts.57.down_proj", "model.layers.11.mlp.experts.58.down_proj", "model.layers.11.mlp.experts.59.down_proj", "model.layers.11.mlp.experts.60.down_proj", "model.layers.11.mlp.experts.61.down_proj", "model.layers.11.mlp.experts.62.down_proj", "model.layers.11.mlp.experts.63.down_proj", "model.layers.11.mlp.experts.64.down_proj", "model.layers.11.mlp.experts.65.down_proj", "model.layers.11.mlp.experts.66.down_proj", "model.layers.11.mlp.experts.67.down_proj", "model.layers.11.mlp.experts.68.down_proj", "model.layers.11.mlp.experts.69.down_proj", "model.layers.11.mlp.experts.70.down_proj", "model.layers.11.mlp.experts.71.down_proj", "model.layers.11.mlp.experts.72.down_proj", "model.layers.11.mlp.experts.73.down_proj", "model.layers.11.mlp.experts.74.down_proj", "model.layers.11.mlp.experts.75.down_proj", "model.layers.11.mlp.experts.76.down_proj", "model.layers.11.mlp.experts.77.down_proj", "model.layers.11.mlp.experts.78.down_proj", "model.layers.11.mlp.experts.79.down_proj", "model.layers.11.mlp.experts.80.down_proj", "model.layers.11.mlp.experts.81.down_proj", "model.layers.11.mlp.experts.82.down_proj", "model.layers.11.mlp.experts.83.down_proj", "model.layers.11.mlp.experts.84.down_proj", "model.layers.11.mlp.experts.85.down_proj", "model.layers.11.mlp.experts.86.down_proj", "model.layers.11.mlp.experts.87.down_proj", "model.layers.11.mlp.experts.88.down_proj", "model.layers.11.mlp.experts.89.down_proj", "model.layers.11.mlp.experts.90.down_proj", "model.layers.11.mlp.experts.91.down_proj", "model.layers.11.mlp.experts.92.down_proj", "model.layers.11.mlp.experts.93.down_proj", "model.layers.11.mlp.experts.94.down_proj", "model.layers.11.mlp.experts.95.down_proj", "model.layers.11.mlp.experts.96.down_proj", "model.layers.11.mlp.experts.97.down_proj", "model.layers.11.mlp.experts.98.down_proj", "model.layers.11.mlp.experts.99.down_proj", "model.layers.11.mlp.experts.100.down_proj", "model.layers.11.mlp.experts.101.down_proj", "model.layers.11.mlp.experts.102.down_proj", "model.layers.11.mlp.experts.103.down_proj", "model.layers.11.mlp.experts.104.down_proj", "model.layers.11.mlp.experts.105.down_proj", "model.layers.11.mlp.experts.106.down_proj", "model.layers.11.mlp.experts.107.down_proj", "model.layers.11.mlp.experts.108.down_proj", "model.layers.11.mlp.experts.109.down_proj", "model.layers.11.mlp.experts.110.down_proj", "model.layers.11.mlp.experts.111.down_proj", "model.layers.11.mlp.experts.112.down_proj", "model.layers.11.mlp.experts.113.down_proj", "model.layers.11.mlp.experts.114.down_proj", "model.layers.11.mlp.experts.115.down_proj", "model.layers.11.mlp.experts.116.down_proj", "model.layers.11.mlp.experts.117.down_proj", "model.layers.11.mlp.experts.118.down_proj", "model.layers.11.mlp.experts.119.down_proj", "model.layers.11.mlp.experts.120.down_proj", "model.layers.11.mlp.experts.121.down_proj", "model.layers.11.mlp.experts.122.down_proj", "model.layers.11.mlp.experts.123.down_proj", "model.layers.11.mlp.experts.124.down_proj", "model.layers.11.mlp.experts.125.down_proj", "model.layers.11.mlp.experts.126.down_proj", "model.layers.11.mlp.experts.127.down_proj", "model.layers.11.mlp.experts.128.down_proj", "model.layers.11.mlp.experts.129.down_proj", "model.layers.11.mlp.experts.130.down_proj", "model.layers.11.mlp.experts.131.down_proj", "model.layers.11.mlp.experts.132.down_proj", "model.layers.11.mlp.experts.133.down_proj", "model.layers.11.mlp.experts.134.down_proj", "model.layers.11.mlp.experts.135.down_proj", "model.layers.11.mlp.experts.136.down_proj", "model.layers.11.mlp.experts.137.down_proj", "model.layers.11.mlp.experts.138.down_proj", "model.layers.11.mlp.experts.139.down_proj", "model.layers.11.mlp.experts.140.down_proj", "model.layers.11.mlp.experts.141.down_proj", "model.layers.11.mlp.experts.142.down_proj", "model.layers.11.mlp.experts.143.down_proj", "model.layers.11.mlp.experts.144.down_proj", "model.layers.11.mlp.experts.145.down_proj", "model.layers.11.mlp.experts.146.down_proj", "model.layers.11.mlp.experts.147.down_proj", "model.layers.11.mlp.experts.148.down_proj", "model.layers.11.mlp.experts.149.down_proj", "model.layers.11.mlp.experts.150.down_proj", "model.layers.11.mlp.experts.151.down_proj", "model.layers.11.mlp.experts.152.down_proj", "model.layers.11.mlp.experts.153.down_proj", "model.layers.11.mlp.experts.154.down_proj", "model.layers.11.mlp.experts.155.down_proj", "model.layers.11.mlp.experts.156.down_proj", "model.layers.11.mlp.experts.157.down_proj", "model.layers.11.mlp.experts.158.down_proj", "model.layers.11.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.8818938881158482e-05, "dbits": 1258291200 }, { "dkld": -3.73600283637629e-05, "dbits": 2516582400 } ] }, { "idx": 69, "layers": [ "model.layers.12.self_attn.q_proj" ], "candidates": [ { "dkld": 1.7168186604977695e-05, "dbits": 62914560 }, { "dkld": -1.2699072249232335e-05, "dbits": 125829120 } ] }, { "idx": 70, "layers": [ "model.layers.12.self_attn.k_proj", "model.layers.12.self_attn.v_proj" ], "candidates": [ { "dkld": 0.00013769504148513148, "dbits": 10485760 }, { "dkld": 0.0001357873668894182, "dbits": 20971520 } ] }, { "idx": 71, "layers": [ "model.layers.12.self_attn.o_proj" ], "candidates": [ { "dkld": 5.2645476534963e-05, "dbits": 62914560 }, { "dkld": 5.770074203610524e-05, "dbits": 125829120 } ] }, { "idx": 72, "layers": [ "model.layers.12.mlp.shared_experts.gate_proj", "model.layers.12.mlp.shared_experts.up_proj", "model.layers.12.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -9.504882618784766e-05, "dbits": 23592960 }, { "dkld": -0.00010586925782263279, "dbits": 47185920 } ] }, { "idx": 73, "layers": [ "model.layers.12.mlp.experts.0.gate_proj", "model.layers.12.mlp.experts.1.gate_proj", "model.layers.12.mlp.experts.2.gate_proj", "model.layers.12.mlp.experts.3.gate_proj", "model.layers.12.mlp.experts.4.gate_proj", "model.layers.12.mlp.experts.5.gate_proj", "model.layers.12.mlp.experts.6.gate_proj", "model.layers.12.mlp.experts.7.gate_proj", "model.layers.12.mlp.experts.8.gate_proj", "model.layers.12.mlp.experts.9.gate_proj", "model.layers.12.mlp.experts.10.gate_proj", "model.layers.12.mlp.experts.11.gate_proj", "model.layers.12.mlp.experts.12.gate_proj", "model.layers.12.mlp.experts.13.gate_proj", "model.layers.12.mlp.experts.14.gate_proj", "model.layers.12.mlp.experts.15.gate_proj", "model.layers.12.mlp.experts.16.gate_proj", "model.layers.12.mlp.experts.17.gate_proj", "model.layers.12.mlp.experts.18.gate_proj", "model.layers.12.mlp.experts.19.gate_proj", "model.layers.12.mlp.experts.20.gate_proj", "model.layers.12.mlp.experts.21.gate_proj", "model.layers.12.mlp.experts.22.gate_proj", "model.layers.12.mlp.experts.23.gate_proj", "model.layers.12.mlp.experts.24.gate_proj", "model.layers.12.mlp.experts.25.gate_proj", "model.layers.12.mlp.experts.26.gate_proj", "model.layers.12.mlp.experts.27.gate_proj", "model.layers.12.mlp.experts.28.gate_proj", "model.layers.12.mlp.experts.29.gate_proj", "model.layers.12.mlp.experts.30.gate_proj", "model.layers.12.mlp.experts.31.gate_proj", "model.layers.12.mlp.experts.32.gate_proj", "model.layers.12.mlp.experts.33.gate_proj", "model.layers.12.mlp.experts.34.gate_proj", "model.layers.12.mlp.experts.35.gate_proj", "model.layers.12.mlp.experts.36.gate_proj", "model.layers.12.mlp.experts.37.gate_proj", "model.layers.12.mlp.experts.38.gate_proj", "model.layers.12.mlp.experts.39.gate_proj", "model.layers.12.mlp.experts.40.gate_proj", "model.layers.12.mlp.experts.41.gate_proj", "model.layers.12.mlp.experts.42.gate_proj", "model.layers.12.mlp.experts.43.gate_proj", "model.layers.12.mlp.experts.44.gate_proj", "model.layers.12.mlp.experts.45.gate_proj", "model.layers.12.mlp.experts.46.gate_proj", "model.layers.12.mlp.experts.47.gate_proj", "model.layers.12.mlp.experts.48.gate_proj", "model.layers.12.mlp.experts.49.gate_proj", "model.layers.12.mlp.experts.50.gate_proj", "model.layers.12.mlp.experts.51.gate_proj", "model.layers.12.mlp.experts.52.gate_proj", "model.layers.12.mlp.experts.53.gate_proj", "model.layers.12.mlp.experts.54.gate_proj", "model.layers.12.mlp.experts.55.gate_proj", "model.layers.12.mlp.experts.56.gate_proj", "model.layers.12.mlp.experts.57.gate_proj", "model.layers.12.mlp.experts.58.gate_proj", "model.layers.12.mlp.experts.59.gate_proj", "model.layers.12.mlp.experts.60.gate_proj", "model.layers.12.mlp.experts.61.gate_proj", "model.layers.12.mlp.experts.62.gate_proj", "model.layers.12.mlp.experts.63.gate_proj", "model.layers.12.mlp.experts.64.gate_proj", "model.layers.12.mlp.experts.65.gate_proj", "model.layers.12.mlp.experts.66.gate_proj", "model.layers.12.mlp.experts.67.gate_proj", "model.layers.12.mlp.experts.68.gate_proj", "model.layers.12.mlp.experts.69.gate_proj", "model.layers.12.mlp.experts.70.gate_proj", "model.layers.12.mlp.experts.71.gate_proj", "model.layers.12.mlp.experts.72.gate_proj", "model.layers.12.mlp.experts.73.gate_proj", "model.layers.12.mlp.experts.74.gate_proj", "model.layers.12.mlp.experts.75.gate_proj", "model.layers.12.mlp.experts.76.gate_proj", "model.layers.12.mlp.experts.77.gate_proj", "model.layers.12.mlp.experts.78.gate_proj", "model.layers.12.mlp.experts.79.gate_proj", "model.layers.12.mlp.experts.80.gate_proj", "model.layers.12.mlp.experts.81.gate_proj", "model.layers.12.mlp.experts.82.gate_proj", "model.layers.12.mlp.experts.83.gate_proj", "model.layers.12.mlp.experts.84.gate_proj", "model.layers.12.mlp.experts.85.gate_proj", "model.layers.12.mlp.experts.86.gate_proj", "model.layers.12.mlp.experts.87.gate_proj", "model.layers.12.mlp.experts.88.gate_proj", "model.layers.12.mlp.experts.89.gate_proj", "model.layers.12.mlp.experts.90.gate_proj", "model.layers.12.mlp.experts.91.gate_proj", "model.layers.12.mlp.experts.92.gate_proj", "model.layers.12.mlp.experts.93.gate_proj", "model.layers.12.mlp.experts.94.gate_proj", "model.layers.12.mlp.experts.95.gate_proj", "model.layers.12.mlp.experts.96.gate_proj", "model.layers.12.mlp.experts.97.gate_proj", "model.layers.12.mlp.experts.98.gate_proj", "model.layers.12.mlp.experts.99.gate_proj", "model.layers.12.mlp.experts.100.gate_proj", "model.layers.12.mlp.experts.101.gate_proj", "model.layers.12.mlp.experts.102.gate_proj", "model.layers.12.mlp.experts.103.gate_proj", "model.layers.12.mlp.experts.104.gate_proj", "model.layers.12.mlp.experts.105.gate_proj", "model.layers.12.mlp.experts.106.gate_proj", "model.layers.12.mlp.experts.107.gate_proj", "model.layers.12.mlp.experts.108.gate_proj", "model.layers.12.mlp.experts.109.gate_proj", "model.layers.12.mlp.experts.110.gate_proj", "model.layers.12.mlp.experts.111.gate_proj", "model.layers.12.mlp.experts.112.gate_proj", "model.layers.12.mlp.experts.113.gate_proj", "model.layers.12.mlp.experts.114.gate_proj", "model.layers.12.mlp.experts.115.gate_proj", "model.layers.12.mlp.experts.116.gate_proj", "model.layers.12.mlp.experts.117.gate_proj", "model.layers.12.mlp.experts.118.gate_proj", "model.layers.12.mlp.experts.119.gate_proj", "model.layers.12.mlp.experts.120.gate_proj", "model.layers.12.mlp.experts.121.gate_proj", "model.layers.12.mlp.experts.122.gate_proj", "model.layers.12.mlp.experts.123.gate_proj", "model.layers.12.mlp.experts.124.gate_proj", "model.layers.12.mlp.experts.125.gate_proj", "model.layers.12.mlp.experts.126.gate_proj", "model.layers.12.mlp.experts.127.gate_proj", "model.layers.12.mlp.experts.128.gate_proj", "model.layers.12.mlp.experts.129.gate_proj", "model.layers.12.mlp.experts.130.gate_proj", "model.layers.12.mlp.experts.131.gate_proj", "model.layers.12.mlp.experts.132.gate_proj", "model.layers.12.mlp.experts.133.gate_proj", "model.layers.12.mlp.experts.134.gate_proj", "model.layers.12.mlp.experts.135.gate_proj", "model.layers.12.mlp.experts.136.gate_proj", "model.layers.12.mlp.experts.137.gate_proj", "model.layers.12.mlp.experts.138.gate_proj", "model.layers.12.mlp.experts.139.gate_proj", "model.layers.12.mlp.experts.140.gate_proj", "model.layers.12.mlp.experts.141.gate_proj", "model.layers.12.mlp.experts.142.gate_proj", "model.layers.12.mlp.experts.143.gate_proj", "model.layers.12.mlp.experts.144.gate_proj", "model.layers.12.mlp.experts.145.gate_proj", "model.layers.12.mlp.experts.146.gate_proj", "model.layers.12.mlp.experts.147.gate_proj", "model.layers.12.mlp.experts.148.gate_proj", "model.layers.12.mlp.experts.149.gate_proj", "model.layers.12.mlp.experts.150.gate_proj", "model.layers.12.mlp.experts.151.gate_proj", "model.layers.12.mlp.experts.152.gate_proj", "model.layers.12.mlp.experts.153.gate_proj", "model.layers.12.mlp.experts.154.gate_proj", "model.layers.12.mlp.experts.155.gate_proj", "model.layers.12.mlp.experts.156.gate_proj", "model.layers.12.mlp.experts.157.gate_proj", "model.layers.12.mlp.experts.158.gate_proj", "model.layers.12.mlp.experts.159.gate_proj", "model.layers.12.mlp.experts.0.up_proj", "model.layers.12.mlp.experts.1.up_proj", "model.layers.12.mlp.experts.2.up_proj", "model.layers.12.mlp.experts.3.up_proj", "model.layers.12.mlp.experts.4.up_proj", "model.layers.12.mlp.experts.5.up_proj", "model.layers.12.mlp.experts.6.up_proj", "model.layers.12.mlp.experts.7.up_proj", "model.layers.12.mlp.experts.8.up_proj", "model.layers.12.mlp.experts.9.up_proj", "model.layers.12.mlp.experts.10.up_proj", "model.layers.12.mlp.experts.11.up_proj", "model.layers.12.mlp.experts.12.up_proj", "model.layers.12.mlp.experts.13.up_proj", "model.layers.12.mlp.experts.14.up_proj", "model.layers.12.mlp.experts.15.up_proj", "model.layers.12.mlp.experts.16.up_proj", "model.layers.12.mlp.experts.17.up_proj", "model.layers.12.mlp.experts.18.up_proj", "model.layers.12.mlp.experts.19.up_proj", "model.layers.12.mlp.experts.20.up_proj", "model.layers.12.mlp.experts.21.up_proj", "model.layers.12.mlp.experts.22.up_proj", "model.layers.12.mlp.experts.23.up_proj", "model.layers.12.mlp.experts.24.up_proj", "model.layers.12.mlp.experts.25.up_proj", "model.layers.12.mlp.experts.26.up_proj", "model.layers.12.mlp.experts.27.up_proj", "model.layers.12.mlp.experts.28.up_proj", "model.layers.12.mlp.experts.29.up_proj", "model.layers.12.mlp.experts.30.up_proj", "model.layers.12.mlp.experts.31.up_proj", "model.layers.12.mlp.experts.32.up_proj", "model.layers.12.mlp.experts.33.up_proj", "model.layers.12.mlp.experts.34.up_proj", "model.layers.12.mlp.experts.35.up_proj", "model.layers.12.mlp.experts.36.up_proj", "model.layers.12.mlp.experts.37.up_proj", "model.layers.12.mlp.experts.38.up_proj", "model.layers.12.mlp.experts.39.up_proj", "model.layers.12.mlp.experts.40.up_proj", "model.layers.12.mlp.experts.41.up_proj", "model.layers.12.mlp.experts.42.up_proj", "model.layers.12.mlp.experts.43.up_proj", "model.layers.12.mlp.experts.44.up_proj", "model.layers.12.mlp.experts.45.up_proj", "model.layers.12.mlp.experts.46.up_proj", "model.layers.12.mlp.experts.47.up_proj", "model.layers.12.mlp.experts.48.up_proj", "model.layers.12.mlp.experts.49.up_proj", "model.layers.12.mlp.experts.50.up_proj", "model.layers.12.mlp.experts.51.up_proj", "model.layers.12.mlp.experts.52.up_proj", "model.layers.12.mlp.experts.53.up_proj", "model.layers.12.mlp.experts.54.up_proj", "model.layers.12.mlp.experts.55.up_proj", "model.layers.12.mlp.experts.56.up_proj", "model.layers.12.mlp.experts.57.up_proj", "model.layers.12.mlp.experts.58.up_proj", "model.layers.12.mlp.experts.59.up_proj", "model.layers.12.mlp.experts.60.up_proj", "model.layers.12.mlp.experts.61.up_proj", "model.layers.12.mlp.experts.62.up_proj", "model.layers.12.mlp.experts.63.up_proj", "model.layers.12.mlp.experts.64.up_proj", "model.layers.12.mlp.experts.65.up_proj", "model.layers.12.mlp.experts.66.up_proj", "model.layers.12.mlp.experts.67.up_proj", "model.layers.12.mlp.experts.68.up_proj", "model.layers.12.mlp.experts.69.up_proj", "model.layers.12.mlp.experts.70.up_proj", "model.layers.12.mlp.experts.71.up_proj", "model.layers.12.mlp.experts.72.up_proj", "model.layers.12.mlp.experts.73.up_proj", "model.layers.12.mlp.experts.74.up_proj", "model.layers.12.mlp.experts.75.up_proj", "model.layers.12.mlp.experts.76.up_proj", "model.layers.12.mlp.experts.77.up_proj", "model.layers.12.mlp.experts.78.up_proj", "model.layers.12.mlp.experts.79.up_proj", "model.layers.12.mlp.experts.80.up_proj", "model.layers.12.mlp.experts.81.up_proj", "model.layers.12.mlp.experts.82.up_proj", "model.layers.12.mlp.experts.83.up_proj", "model.layers.12.mlp.experts.84.up_proj", "model.layers.12.mlp.experts.85.up_proj", "model.layers.12.mlp.experts.86.up_proj", "model.layers.12.mlp.experts.87.up_proj", "model.layers.12.mlp.experts.88.up_proj", "model.layers.12.mlp.experts.89.up_proj", "model.layers.12.mlp.experts.90.up_proj", "model.layers.12.mlp.experts.91.up_proj", "model.layers.12.mlp.experts.92.up_proj", "model.layers.12.mlp.experts.93.up_proj", "model.layers.12.mlp.experts.94.up_proj", "model.layers.12.mlp.experts.95.up_proj", "model.layers.12.mlp.experts.96.up_proj", "model.layers.12.mlp.experts.97.up_proj", "model.layers.12.mlp.experts.98.up_proj", "model.layers.12.mlp.experts.99.up_proj", "model.layers.12.mlp.experts.100.up_proj", "model.layers.12.mlp.experts.101.up_proj", "model.layers.12.mlp.experts.102.up_proj", "model.layers.12.mlp.experts.103.up_proj", "model.layers.12.mlp.experts.104.up_proj", "model.layers.12.mlp.experts.105.up_proj", "model.layers.12.mlp.experts.106.up_proj", "model.layers.12.mlp.experts.107.up_proj", "model.layers.12.mlp.experts.108.up_proj", "model.layers.12.mlp.experts.109.up_proj", "model.layers.12.mlp.experts.110.up_proj", "model.layers.12.mlp.experts.111.up_proj", "model.layers.12.mlp.experts.112.up_proj", "model.layers.12.mlp.experts.113.up_proj", "model.layers.12.mlp.experts.114.up_proj", "model.layers.12.mlp.experts.115.up_proj", "model.layers.12.mlp.experts.116.up_proj", "model.layers.12.mlp.experts.117.up_proj", "model.layers.12.mlp.experts.118.up_proj", "model.layers.12.mlp.experts.119.up_proj", "model.layers.12.mlp.experts.120.up_proj", "model.layers.12.mlp.experts.121.up_proj", "model.layers.12.mlp.experts.122.up_proj", "model.layers.12.mlp.experts.123.up_proj", "model.layers.12.mlp.experts.124.up_proj", "model.layers.12.mlp.experts.125.up_proj", "model.layers.12.mlp.experts.126.up_proj", "model.layers.12.mlp.experts.127.up_proj", "model.layers.12.mlp.experts.128.up_proj", "model.layers.12.mlp.experts.129.up_proj", "model.layers.12.mlp.experts.130.up_proj", "model.layers.12.mlp.experts.131.up_proj", "model.layers.12.mlp.experts.132.up_proj", "model.layers.12.mlp.experts.133.up_proj", "model.layers.12.mlp.experts.134.up_proj", "model.layers.12.mlp.experts.135.up_proj", "model.layers.12.mlp.experts.136.up_proj", "model.layers.12.mlp.experts.137.up_proj", "model.layers.12.mlp.experts.138.up_proj", "model.layers.12.mlp.experts.139.up_proj", "model.layers.12.mlp.experts.140.up_proj", "model.layers.12.mlp.experts.141.up_proj", "model.layers.12.mlp.experts.142.up_proj", "model.layers.12.mlp.experts.143.up_proj", "model.layers.12.mlp.experts.144.up_proj", "model.layers.12.mlp.experts.145.up_proj", "model.layers.12.mlp.experts.146.up_proj", "model.layers.12.mlp.experts.147.up_proj", "model.layers.12.mlp.experts.148.up_proj", "model.layers.12.mlp.experts.149.up_proj", "model.layers.12.mlp.experts.150.up_proj", "model.layers.12.mlp.experts.151.up_proj", "model.layers.12.mlp.experts.152.up_proj", "model.layers.12.mlp.experts.153.up_proj", "model.layers.12.mlp.experts.154.up_proj", "model.layers.12.mlp.experts.155.up_proj", "model.layers.12.mlp.experts.156.up_proj", "model.layers.12.mlp.experts.157.up_proj", "model.layers.12.mlp.experts.158.up_proj", "model.layers.12.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -5.503208376467228e-05, "dbits": 2516582400 }, { "dkld": -6.769178435206413e-05, "dbits": 5033164800 } ] }, { "idx": 74, "layers": [ "model.layers.12.mlp.experts.0.down_proj", "model.layers.12.mlp.experts.1.down_proj", "model.layers.12.mlp.experts.2.down_proj", "model.layers.12.mlp.experts.3.down_proj", "model.layers.12.mlp.experts.4.down_proj", "model.layers.12.mlp.experts.5.down_proj", "model.layers.12.mlp.experts.6.down_proj", "model.layers.12.mlp.experts.7.down_proj", "model.layers.12.mlp.experts.8.down_proj", "model.layers.12.mlp.experts.9.down_proj", "model.layers.12.mlp.experts.10.down_proj", "model.layers.12.mlp.experts.11.down_proj", "model.layers.12.mlp.experts.12.down_proj", "model.layers.12.mlp.experts.13.down_proj", "model.layers.12.mlp.experts.14.down_proj", "model.layers.12.mlp.experts.15.down_proj", "model.layers.12.mlp.experts.16.down_proj", "model.layers.12.mlp.experts.17.down_proj", "model.layers.12.mlp.experts.18.down_proj", "model.layers.12.mlp.experts.19.down_proj", "model.layers.12.mlp.experts.20.down_proj", "model.layers.12.mlp.experts.21.down_proj", "model.layers.12.mlp.experts.22.down_proj", "model.layers.12.mlp.experts.23.down_proj", "model.layers.12.mlp.experts.24.down_proj", "model.layers.12.mlp.experts.25.down_proj", "model.layers.12.mlp.experts.26.down_proj", "model.layers.12.mlp.experts.27.down_proj", "model.layers.12.mlp.experts.28.down_proj", "model.layers.12.mlp.experts.29.down_proj", "model.layers.12.mlp.experts.30.down_proj", "model.layers.12.mlp.experts.31.down_proj", "model.layers.12.mlp.experts.32.down_proj", "model.layers.12.mlp.experts.33.down_proj", "model.layers.12.mlp.experts.34.down_proj", "model.layers.12.mlp.experts.35.down_proj", "model.layers.12.mlp.experts.36.down_proj", "model.layers.12.mlp.experts.37.down_proj", "model.layers.12.mlp.experts.38.down_proj", "model.layers.12.mlp.experts.39.down_proj", "model.layers.12.mlp.experts.40.down_proj", "model.layers.12.mlp.experts.41.down_proj", "model.layers.12.mlp.experts.42.down_proj", "model.layers.12.mlp.experts.43.down_proj", "model.layers.12.mlp.experts.44.down_proj", "model.layers.12.mlp.experts.45.down_proj", "model.layers.12.mlp.experts.46.down_proj", "model.layers.12.mlp.experts.47.down_proj", "model.layers.12.mlp.experts.48.down_proj", "model.layers.12.mlp.experts.49.down_proj", "model.layers.12.mlp.experts.50.down_proj", "model.layers.12.mlp.experts.51.down_proj", "model.layers.12.mlp.experts.52.down_proj", "model.layers.12.mlp.experts.53.down_proj", "model.layers.12.mlp.experts.54.down_proj", "model.layers.12.mlp.experts.55.down_proj", "model.layers.12.mlp.experts.56.down_proj", "model.layers.12.mlp.experts.57.down_proj", "model.layers.12.mlp.experts.58.down_proj", "model.layers.12.mlp.experts.59.down_proj", "model.layers.12.mlp.experts.60.down_proj", "model.layers.12.mlp.experts.61.down_proj", "model.layers.12.mlp.experts.62.down_proj", "model.layers.12.mlp.experts.63.down_proj", "model.layers.12.mlp.experts.64.down_proj", "model.layers.12.mlp.experts.65.down_proj", "model.layers.12.mlp.experts.66.down_proj", "model.layers.12.mlp.experts.67.down_proj", "model.layers.12.mlp.experts.68.down_proj", "model.layers.12.mlp.experts.69.down_proj", "model.layers.12.mlp.experts.70.down_proj", "model.layers.12.mlp.experts.71.down_proj", "model.layers.12.mlp.experts.72.down_proj", "model.layers.12.mlp.experts.73.down_proj", "model.layers.12.mlp.experts.74.down_proj", "model.layers.12.mlp.experts.75.down_proj", "model.layers.12.mlp.experts.76.down_proj", "model.layers.12.mlp.experts.77.down_proj", "model.layers.12.mlp.experts.78.down_proj", "model.layers.12.mlp.experts.79.down_proj", "model.layers.12.mlp.experts.80.down_proj", "model.layers.12.mlp.experts.81.down_proj", "model.layers.12.mlp.experts.82.down_proj", "model.layers.12.mlp.experts.83.down_proj", "model.layers.12.mlp.experts.84.down_proj", "model.layers.12.mlp.experts.85.down_proj", "model.layers.12.mlp.experts.86.down_proj", "model.layers.12.mlp.experts.87.down_proj", "model.layers.12.mlp.experts.88.down_proj", "model.layers.12.mlp.experts.89.down_proj", "model.layers.12.mlp.experts.90.down_proj", "model.layers.12.mlp.experts.91.down_proj", "model.layers.12.mlp.experts.92.down_proj", "model.layers.12.mlp.experts.93.down_proj", "model.layers.12.mlp.experts.94.down_proj", "model.layers.12.mlp.experts.95.down_proj", "model.layers.12.mlp.experts.96.down_proj", "model.layers.12.mlp.experts.97.down_proj", "model.layers.12.mlp.experts.98.down_proj", "model.layers.12.mlp.experts.99.down_proj", "model.layers.12.mlp.experts.100.down_proj", "model.layers.12.mlp.experts.101.down_proj", "model.layers.12.mlp.experts.102.down_proj", "model.layers.12.mlp.experts.103.down_proj", "model.layers.12.mlp.experts.104.down_proj", "model.layers.12.mlp.experts.105.down_proj", "model.layers.12.mlp.experts.106.down_proj", "model.layers.12.mlp.experts.107.down_proj", "model.layers.12.mlp.experts.108.down_proj", "model.layers.12.mlp.experts.109.down_proj", "model.layers.12.mlp.experts.110.down_proj", "model.layers.12.mlp.experts.111.down_proj", "model.layers.12.mlp.experts.112.down_proj", "model.layers.12.mlp.experts.113.down_proj", "model.layers.12.mlp.experts.114.down_proj", "model.layers.12.mlp.experts.115.down_proj", "model.layers.12.mlp.experts.116.down_proj", "model.layers.12.mlp.experts.117.down_proj", "model.layers.12.mlp.experts.118.down_proj", "model.layers.12.mlp.experts.119.down_proj", "model.layers.12.mlp.experts.120.down_proj", "model.layers.12.mlp.experts.121.down_proj", "model.layers.12.mlp.experts.122.down_proj", "model.layers.12.mlp.experts.123.down_proj", "model.layers.12.mlp.experts.124.down_proj", "model.layers.12.mlp.experts.125.down_proj", "model.layers.12.mlp.experts.126.down_proj", "model.layers.12.mlp.experts.127.down_proj", "model.layers.12.mlp.experts.128.down_proj", "model.layers.12.mlp.experts.129.down_proj", "model.layers.12.mlp.experts.130.down_proj", "model.layers.12.mlp.experts.131.down_proj", "model.layers.12.mlp.experts.132.down_proj", "model.layers.12.mlp.experts.133.down_proj", "model.layers.12.mlp.experts.134.down_proj", "model.layers.12.mlp.experts.135.down_proj", "model.layers.12.mlp.experts.136.down_proj", "model.layers.12.mlp.experts.137.down_proj", "model.layers.12.mlp.experts.138.down_proj", "model.layers.12.mlp.experts.139.down_proj", "model.layers.12.mlp.experts.140.down_proj", "model.layers.12.mlp.experts.141.down_proj", "model.layers.12.mlp.experts.142.down_proj", "model.layers.12.mlp.experts.143.down_proj", "model.layers.12.mlp.experts.144.down_proj", "model.layers.12.mlp.experts.145.down_proj", "model.layers.12.mlp.experts.146.down_proj", "model.layers.12.mlp.experts.147.down_proj", "model.layers.12.mlp.experts.148.down_proj", "model.layers.12.mlp.experts.149.down_proj", "model.layers.12.mlp.experts.150.down_proj", "model.layers.12.mlp.experts.151.down_proj", "model.layers.12.mlp.experts.152.down_proj", "model.layers.12.mlp.experts.153.down_proj", "model.layers.12.mlp.experts.154.down_proj", "model.layers.12.mlp.experts.155.down_proj", "model.layers.12.mlp.experts.156.down_proj", "model.layers.12.mlp.experts.157.down_proj", "model.layers.12.mlp.experts.158.down_proj", "model.layers.12.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.273122806102003e-05, "dbits": 1258291200 }, { "dkld": -6.357193924486602e-05, "dbits": 2516582400 } ] }, { "idx": 75, "layers": [ "model.layers.13.self_attn.q_proj" ], "candidates": [ { "dkld": -0.0001015390967950211, "dbits": 62914560 }, { "dkld": -9.110525716096024e-05, "dbits": 125829120 } ] }, { "idx": 76, "layers": [ "model.layers.13.self_attn.k_proj", "model.layers.13.self_attn.v_proj" ], "candidates": [ { "dkld": -4.087204579263787e-05, "dbits": 10485760 }, { "dkld": 4.606575239449878e-05, "dbits": 20971520 } ] }, { "idx": 77, "layers": [ "model.layers.13.self_attn.o_proj" ], "candidates": [ { "dkld": -8.727719541638986e-05, "dbits": 62914560 }, { "dkld": -8.510849438607589e-05, "dbits": 125829120 } ] }, { "idx": 78, "layers": [ "model.layers.13.mlp.shared_experts.gate_proj", "model.layers.13.mlp.shared_experts.up_proj", "model.layers.13.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 0.0001737601589411504, "dbits": 23592960 }, { "dkld": 0.00020437347702682157, "dbits": 47185920 } ] }, { "idx": 79, "layers": [ "model.layers.13.mlp.experts.0.gate_proj", "model.layers.13.mlp.experts.1.gate_proj", "model.layers.13.mlp.experts.2.gate_proj", "model.layers.13.mlp.experts.3.gate_proj", "model.layers.13.mlp.experts.4.gate_proj", "model.layers.13.mlp.experts.5.gate_proj", "model.layers.13.mlp.experts.6.gate_proj", "model.layers.13.mlp.experts.7.gate_proj", "model.layers.13.mlp.experts.8.gate_proj", "model.layers.13.mlp.experts.9.gate_proj", "model.layers.13.mlp.experts.10.gate_proj", "model.layers.13.mlp.experts.11.gate_proj", "model.layers.13.mlp.experts.12.gate_proj", "model.layers.13.mlp.experts.13.gate_proj", "model.layers.13.mlp.experts.14.gate_proj", "model.layers.13.mlp.experts.15.gate_proj", "model.layers.13.mlp.experts.16.gate_proj", "model.layers.13.mlp.experts.17.gate_proj", "model.layers.13.mlp.experts.18.gate_proj", "model.layers.13.mlp.experts.19.gate_proj", "model.layers.13.mlp.experts.20.gate_proj", "model.layers.13.mlp.experts.21.gate_proj", "model.layers.13.mlp.experts.22.gate_proj", "model.layers.13.mlp.experts.23.gate_proj", "model.layers.13.mlp.experts.24.gate_proj", "model.layers.13.mlp.experts.25.gate_proj", "model.layers.13.mlp.experts.26.gate_proj", "model.layers.13.mlp.experts.27.gate_proj", "model.layers.13.mlp.experts.28.gate_proj", "model.layers.13.mlp.experts.29.gate_proj", "model.layers.13.mlp.experts.30.gate_proj", "model.layers.13.mlp.experts.31.gate_proj", "model.layers.13.mlp.experts.32.gate_proj", "model.layers.13.mlp.experts.33.gate_proj", "model.layers.13.mlp.experts.34.gate_proj", "model.layers.13.mlp.experts.35.gate_proj", "model.layers.13.mlp.experts.36.gate_proj", "model.layers.13.mlp.experts.37.gate_proj", "model.layers.13.mlp.experts.38.gate_proj", "model.layers.13.mlp.experts.39.gate_proj", "model.layers.13.mlp.experts.40.gate_proj", "model.layers.13.mlp.experts.41.gate_proj", "model.layers.13.mlp.experts.42.gate_proj", "model.layers.13.mlp.experts.43.gate_proj", "model.layers.13.mlp.experts.44.gate_proj", "model.layers.13.mlp.experts.45.gate_proj", "model.layers.13.mlp.experts.46.gate_proj", "model.layers.13.mlp.experts.47.gate_proj", "model.layers.13.mlp.experts.48.gate_proj", "model.layers.13.mlp.experts.49.gate_proj", "model.layers.13.mlp.experts.50.gate_proj", "model.layers.13.mlp.experts.51.gate_proj", "model.layers.13.mlp.experts.52.gate_proj", "model.layers.13.mlp.experts.53.gate_proj", "model.layers.13.mlp.experts.54.gate_proj", "model.layers.13.mlp.experts.55.gate_proj", "model.layers.13.mlp.experts.56.gate_proj", "model.layers.13.mlp.experts.57.gate_proj", "model.layers.13.mlp.experts.58.gate_proj", "model.layers.13.mlp.experts.59.gate_proj", "model.layers.13.mlp.experts.60.gate_proj", "model.layers.13.mlp.experts.61.gate_proj", "model.layers.13.mlp.experts.62.gate_proj", "model.layers.13.mlp.experts.63.gate_proj", "model.layers.13.mlp.experts.64.gate_proj", "model.layers.13.mlp.experts.65.gate_proj", "model.layers.13.mlp.experts.66.gate_proj", "model.layers.13.mlp.experts.67.gate_proj", "model.layers.13.mlp.experts.68.gate_proj", "model.layers.13.mlp.experts.69.gate_proj", "model.layers.13.mlp.experts.70.gate_proj", "model.layers.13.mlp.experts.71.gate_proj", "model.layers.13.mlp.experts.72.gate_proj", "model.layers.13.mlp.experts.73.gate_proj", "model.layers.13.mlp.experts.74.gate_proj", "model.layers.13.mlp.experts.75.gate_proj", "model.layers.13.mlp.experts.76.gate_proj", "model.layers.13.mlp.experts.77.gate_proj", "model.layers.13.mlp.experts.78.gate_proj", "model.layers.13.mlp.experts.79.gate_proj", "model.layers.13.mlp.experts.80.gate_proj", "model.layers.13.mlp.experts.81.gate_proj", "model.layers.13.mlp.experts.82.gate_proj", "model.layers.13.mlp.experts.83.gate_proj", "model.layers.13.mlp.experts.84.gate_proj", "model.layers.13.mlp.experts.85.gate_proj", "model.layers.13.mlp.experts.86.gate_proj", "model.layers.13.mlp.experts.87.gate_proj", "model.layers.13.mlp.experts.88.gate_proj", "model.layers.13.mlp.experts.89.gate_proj", "model.layers.13.mlp.experts.90.gate_proj", "model.layers.13.mlp.experts.91.gate_proj", "model.layers.13.mlp.experts.92.gate_proj", "model.layers.13.mlp.experts.93.gate_proj", "model.layers.13.mlp.experts.94.gate_proj", "model.layers.13.mlp.experts.95.gate_proj", "model.layers.13.mlp.experts.96.gate_proj", "model.layers.13.mlp.experts.97.gate_proj", "model.layers.13.mlp.experts.98.gate_proj", "model.layers.13.mlp.experts.99.gate_proj", "model.layers.13.mlp.experts.100.gate_proj", "model.layers.13.mlp.experts.101.gate_proj", "model.layers.13.mlp.experts.102.gate_proj", "model.layers.13.mlp.experts.103.gate_proj", "model.layers.13.mlp.experts.104.gate_proj", "model.layers.13.mlp.experts.105.gate_proj", "model.layers.13.mlp.experts.106.gate_proj", "model.layers.13.mlp.experts.107.gate_proj", "model.layers.13.mlp.experts.108.gate_proj", "model.layers.13.mlp.experts.109.gate_proj", "model.layers.13.mlp.experts.110.gate_proj", "model.layers.13.mlp.experts.111.gate_proj", "model.layers.13.mlp.experts.112.gate_proj", "model.layers.13.mlp.experts.113.gate_proj", "model.layers.13.mlp.experts.114.gate_proj", "model.layers.13.mlp.experts.115.gate_proj", "model.layers.13.mlp.experts.116.gate_proj", "model.layers.13.mlp.experts.117.gate_proj", "model.layers.13.mlp.experts.118.gate_proj", "model.layers.13.mlp.experts.119.gate_proj", "model.layers.13.mlp.experts.120.gate_proj", "model.layers.13.mlp.experts.121.gate_proj", "model.layers.13.mlp.experts.122.gate_proj", "model.layers.13.mlp.experts.123.gate_proj", "model.layers.13.mlp.experts.124.gate_proj", "model.layers.13.mlp.experts.125.gate_proj", "model.layers.13.mlp.experts.126.gate_proj", "model.layers.13.mlp.experts.127.gate_proj", "model.layers.13.mlp.experts.128.gate_proj", "model.layers.13.mlp.experts.129.gate_proj", "model.layers.13.mlp.experts.130.gate_proj", "model.layers.13.mlp.experts.131.gate_proj", "model.layers.13.mlp.experts.132.gate_proj", "model.layers.13.mlp.experts.133.gate_proj", "model.layers.13.mlp.experts.134.gate_proj", "model.layers.13.mlp.experts.135.gate_proj", "model.layers.13.mlp.experts.136.gate_proj", "model.layers.13.mlp.experts.137.gate_proj", "model.layers.13.mlp.experts.138.gate_proj", "model.layers.13.mlp.experts.139.gate_proj", "model.layers.13.mlp.experts.140.gate_proj", "model.layers.13.mlp.experts.141.gate_proj", "model.layers.13.mlp.experts.142.gate_proj", "model.layers.13.mlp.experts.143.gate_proj", "model.layers.13.mlp.experts.144.gate_proj", "model.layers.13.mlp.experts.145.gate_proj", "model.layers.13.mlp.experts.146.gate_proj", "model.layers.13.mlp.experts.147.gate_proj", "model.layers.13.mlp.experts.148.gate_proj", "model.layers.13.mlp.experts.149.gate_proj", "model.layers.13.mlp.experts.150.gate_proj", "model.layers.13.mlp.experts.151.gate_proj", "model.layers.13.mlp.experts.152.gate_proj", "model.layers.13.mlp.experts.153.gate_proj", "model.layers.13.mlp.experts.154.gate_proj", "model.layers.13.mlp.experts.155.gate_proj", "model.layers.13.mlp.experts.156.gate_proj", "model.layers.13.mlp.experts.157.gate_proj", "model.layers.13.mlp.experts.158.gate_proj", "model.layers.13.mlp.experts.159.gate_proj", "model.layers.13.mlp.experts.0.up_proj", "model.layers.13.mlp.experts.1.up_proj", "model.layers.13.mlp.experts.2.up_proj", "model.layers.13.mlp.experts.3.up_proj", "model.layers.13.mlp.experts.4.up_proj", "model.layers.13.mlp.experts.5.up_proj", "model.layers.13.mlp.experts.6.up_proj", "model.layers.13.mlp.experts.7.up_proj", "model.layers.13.mlp.experts.8.up_proj", "model.layers.13.mlp.experts.9.up_proj", "model.layers.13.mlp.experts.10.up_proj", "model.layers.13.mlp.experts.11.up_proj", "model.layers.13.mlp.experts.12.up_proj", "model.layers.13.mlp.experts.13.up_proj", "model.layers.13.mlp.experts.14.up_proj", "model.layers.13.mlp.experts.15.up_proj", "model.layers.13.mlp.experts.16.up_proj", "model.layers.13.mlp.experts.17.up_proj", "model.layers.13.mlp.experts.18.up_proj", "model.layers.13.mlp.experts.19.up_proj", "model.layers.13.mlp.experts.20.up_proj", "model.layers.13.mlp.experts.21.up_proj", "model.layers.13.mlp.experts.22.up_proj", "model.layers.13.mlp.experts.23.up_proj", "model.layers.13.mlp.experts.24.up_proj", "model.layers.13.mlp.experts.25.up_proj", "model.layers.13.mlp.experts.26.up_proj", "model.layers.13.mlp.experts.27.up_proj", "model.layers.13.mlp.experts.28.up_proj", "model.layers.13.mlp.experts.29.up_proj", "model.layers.13.mlp.experts.30.up_proj", "model.layers.13.mlp.experts.31.up_proj", "model.layers.13.mlp.experts.32.up_proj", "model.layers.13.mlp.experts.33.up_proj", "model.layers.13.mlp.experts.34.up_proj", "model.layers.13.mlp.experts.35.up_proj", "model.layers.13.mlp.experts.36.up_proj", "model.layers.13.mlp.experts.37.up_proj", "model.layers.13.mlp.experts.38.up_proj", "model.layers.13.mlp.experts.39.up_proj", "model.layers.13.mlp.experts.40.up_proj", "model.layers.13.mlp.experts.41.up_proj", "model.layers.13.mlp.experts.42.up_proj", "model.layers.13.mlp.experts.43.up_proj", "model.layers.13.mlp.experts.44.up_proj", "model.layers.13.mlp.experts.45.up_proj", "model.layers.13.mlp.experts.46.up_proj", "model.layers.13.mlp.experts.47.up_proj", "model.layers.13.mlp.experts.48.up_proj", "model.layers.13.mlp.experts.49.up_proj", "model.layers.13.mlp.experts.50.up_proj", "model.layers.13.mlp.experts.51.up_proj", "model.layers.13.mlp.experts.52.up_proj", "model.layers.13.mlp.experts.53.up_proj", "model.layers.13.mlp.experts.54.up_proj", "model.layers.13.mlp.experts.55.up_proj", "model.layers.13.mlp.experts.56.up_proj", "model.layers.13.mlp.experts.57.up_proj", "model.layers.13.mlp.experts.58.up_proj", "model.layers.13.mlp.experts.59.up_proj", "model.layers.13.mlp.experts.60.up_proj", "model.layers.13.mlp.experts.61.up_proj", "model.layers.13.mlp.experts.62.up_proj", "model.layers.13.mlp.experts.63.up_proj", "model.layers.13.mlp.experts.64.up_proj", "model.layers.13.mlp.experts.65.up_proj", "model.layers.13.mlp.experts.66.up_proj", "model.layers.13.mlp.experts.67.up_proj", "model.layers.13.mlp.experts.68.up_proj", "model.layers.13.mlp.experts.69.up_proj", "model.layers.13.mlp.experts.70.up_proj", "model.layers.13.mlp.experts.71.up_proj", "model.layers.13.mlp.experts.72.up_proj", "model.layers.13.mlp.experts.73.up_proj", "model.layers.13.mlp.experts.74.up_proj", "model.layers.13.mlp.experts.75.up_proj", "model.layers.13.mlp.experts.76.up_proj", "model.layers.13.mlp.experts.77.up_proj", "model.layers.13.mlp.experts.78.up_proj", "model.layers.13.mlp.experts.79.up_proj", "model.layers.13.mlp.experts.80.up_proj", "model.layers.13.mlp.experts.81.up_proj", "model.layers.13.mlp.experts.82.up_proj", "model.layers.13.mlp.experts.83.up_proj", "model.layers.13.mlp.experts.84.up_proj", "model.layers.13.mlp.experts.85.up_proj", "model.layers.13.mlp.experts.86.up_proj", "model.layers.13.mlp.experts.87.up_proj", "model.layers.13.mlp.experts.88.up_proj", "model.layers.13.mlp.experts.89.up_proj", "model.layers.13.mlp.experts.90.up_proj", "model.layers.13.mlp.experts.91.up_proj", "model.layers.13.mlp.experts.92.up_proj", "model.layers.13.mlp.experts.93.up_proj", "model.layers.13.mlp.experts.94.up_proj", "model.layers.13.mlp.experts.95.up_proj", "model.layers.13.mlp.experts.96.up_proj", "model.layers.13.mlp.experts.97.up_proj", "model.layers.13.mlp.experts.98.up_proj", "model.layers.13.mlp.experts.99.up_proj", "model.layers.13.mlp.experts.100.up_proj", "model.layers.13.mlp.experts.101.up_proj", "model.layers.13.mlp.experts.102.up_proj", "model.layers.13.mlp.experts.103.up_proj", "model.layers.13.mlp.experts.104.up_proj", "model.layers.13.mlp.experts.105.up_proj", "model.layers.13.mlp.experts.106.up_proj", "model.layers.13.mlp.experts.107.up_proj", "model.layers.13.mlp.experts.108.up_proj", "model.layers.13.mlp.experts.109.up_proj", "model.layers.13.mlp.experts.110.up_proj", "model.layers.13.mlp.experts.111.up_proj", "model.layers.13.mlp.experts.112.up_proj", "model.layers.13.mlp.experts.113.up_proj", "model.layers.13.mlp.experts.114.up_proj", "model.layers.13.mlp.experts.115.up_proj", "model.layers.13.mlp.experts.116.up_proj", "model.layers.13.mlp.experts.117.up_proj", "model.layers.13.mlp.experts.118.up_proj", "model.layers.13.mlp.experts.119.up_proj", "model.layers.13.mlp.experts.120.up_proj", "model.layers.13.mlp.experts.121.up_proj", "model.layers.13.mlp.experts.122.up_proj", "model.layers.13.mlp.experts.123.up_proj", "model.layers.13.mlp.experts.124.up_proj", "model.layers.13.mlp.experts.125.up_proj", "model.layers.13.mlp.experts.126.up_proj", "model.layers.13.mlp.experts.127.up_proj", "model.layers.13.mlp.experts.128.up_proj", "model.layers.13.mlp.experts.129.up_proj", "model.layers.13.mlp.experts.130.up_proj", "model.layers.13.mlp.experts.131.up_proj", "model.layers.13.mlp.experts.132.up_proj", "model.layers.13.mlp.experts.133.up_proj", "model.layers.13.mlp.experts.134.up_proj", "model.layers.13.mlp.experts.135.up_proj", "model.layers.13.mlp.experts.136.up_proj", "model.layers.13.mlp.experts.137.up_proj", "model.layers.13.mlp.experts.138.up_proj", "model.layers.13.mlp.experts.139.up_proj", "model.layers.13.mlp.experts.140.up_proj", "model.layers.13.mlp.experts.141.up_proj", "model.layers.13.mlp.experts.142.up_proj", "model.layers.13.mlp.experts.143.up_proj", "model.layers.13.mlp.experts.144.up_proj", "model.layers.13.mlp.experts.145.up_proj", "model.layers.13.mlp.experts.146.up_proj", "model.layers.13.mlp.experts.147.up_proj", "model.layers.13.mlp.experts.148.up_proj", "model.layers.13.mlp.experts.149.up_proj", "model.layers.13.mlp.experts.150.up_proj", "model.layers.13.mlp.experts.151.up_proj", "model.layers.13.mlp.experts.152.up_proj", "model.layers.13.mlp.experts.153.up_proj", "model.layers.13.mlp.experts.154.up_proj", "model.layers.13.mlp.experts.155.up_proj", "model.layers.13.mlp.experts.156.up_proj", "model.layers.13.mlp.experts.157.up_proj", "model.layers.13.mlp.experts.158.up_proj", "model.layers.13.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.293904200196197e-05, "dbits": 2516582400 }, { "dkld": -0.0001513298135250793, "dbits": 5033164800 } ] }, { "idx": 80, "layers": [ "model.layers.13.mlp.experts.0.down_proj", "model.layers.13.mlp.experts.1.down_proj", "model.layers.13.mlp.experts.2.down_proj", "model.layers.13.mlp.experts.3.down_proj", "model.layers.13.mlp.experts.4.down_proj", "model.layers.13.mlp.experts.5.down_proj", "model.layers.13.mlp.experts.6.down_proj", "model.layers.13.mlp.experts.7.down_proj", "model.layers.13.mlp.experts.8.down_proj", "model.layers.13.mlp.experts.9.down_proj", "model.layers.13.mlp.experts.10.down_proj", "model.layers.13.mlp.experts.11.down_proj", "model.layers.13.mlp.experts.12.down_proj", "model.layers.13.mlp.experts.13.down_proj", "model.layers.13.mlp.experts.14.down_proj", "model.layers.13.mlp.experts.15.down_proj", "model.layers.13.mlp.experts.16.down_proj", "model.layers.13.mlp.experts.17.down_proj", "model.layers.13.mlp.experts.18.down_proj", "model.layers.13.mlp.experts.19.down_proj", "model.layers.13.mlp.experts.20.down_proj", "model.layers.13.mlp.experts.21.down_proj", "model.layers.13.mlp.experts.22.down_proj", "model.layers.13.mlp.experts.23.down_proj", "model.layers.13.mlp.experts.24.down_proj", "model.layers.13.mlp.experts.25.down_proj", "model.layers.13.mlp.experts.26.down_proj", "model.layers.13.mlp.experts.27.down_proj", "model.layers.13.mlp.experts.28.down_proj", "model.layers.13.mlp.experts.29.down_proj", "model.layers.13.mlp.experts.30.down_proj", "model.layers.13.mlp.experts.31.down_proj", "model.layers.13.mlp.experts.32.down_proj", "model.layers.13.mlp.experts.33.down_proj", "model.layers.13.mlp.experts.34.down_proj", "model.layers.13.mlp.experts.35.down_proj", "model.layers.13.mlp.experts.36.down_proj", "model.layers.13.mlp.experts.37.down_proj", "model.layers.13.mlp.experts.38.down_proj", "model.layers.13.mlp.experts.39.down_proj", "model.layers.13.mlp.experts.40.down_proj", "model.layers.13.mlp.experts.41.down_proj", "model.layers.13.mlp.experts.42.down_proj", "model.layers.13.mlp.experts.43.down_proj", "model.layers.13.mlp.experts.44.down_proj", "model.layers.13.mlp.experts.45.down_proj", "model.layers.13.mlp.experts.46.down_proj", "model.layers.13.mlp.experts.47.down_proj", "model.layers.13.mlp.experts.48.down_proj", "model.layers.13.mlp.experts.49.down_proj", "model.layers.13.mlp.experts.50.down_proj", "model.layers.13.mlp.experts.51.down_proj", "model.layers.13.mlp.experts.52.down_proj", "model.layers.13.mlp.experts.53.down_proj", "model.layers.13.mlp.experts.54.down_proj", "model.layers.13.mlp.experts.55.down_proj", "model.layers.13.mlp.experts.56.down_proj", "model.layers.13.mlp.experts.57.down_proj", "model.layers.13.mlp.experts.58.down_proj", "model.layers.13.mlp.experts.59.down_proj", "model.layers.13.mlp.experts.60.down_proj", "model.layers.13.mlp.experts.61.down_proj", "model.layers.13.mlp.experts.62.down_proj", "model.layers.13.mlp.experts.63.down_proj", "model.layers.13.mlp.experts.64.down_proj", "model.layers.13.mlp.experts.65.down_proj", "model.layers.13.mlp.experts.66.down_proj", "model.layers.13.mlp.experts.67.down_proj", "model.layers.13.mlp.experts.68.down_proj", "model.layers.13.mlp.experts.69.down_proj", "model.layers.13.mlp.experts.70.down_proj", "model.layers.13.mlp.experts.71.down_proj", "model.layers.13.mlp.experts.72.down_proj", "model.layers.13.mlp.experts.73.down_proj", "model.layers.13.mlp.experts.74.down_proj", "model.layers.13.mlp.experts.75.down_proj", "model.layers.13.mlp.experts.76.down_proj", "model.layers.13.mlp.experts.77.down_proj", "model.layers.13.mlp.experts.78.down_proj", "model.layers.13.mlp.experts.79.down_proj", "model.layers.13.mlp.experts.80.down_proj", "model.layers.13.mlp.experts.81.down_proj", "model.layers.13.mlp.experts.82.down_proj", "model.layers.13.mlp.experts.83.down_proj", "model.layers.13.mlp.experts.84.down_proj", "model.layers.13.mlp.experts.85.down_proj", "model.layers.13.mlp.experts.86.down_proj", "model.layers.13.mlp.experts.87.down_proj", "model.layers.13.mlp.experts.88.down_proj", "model.layers.13.mlp.experts.89.down_proj", "model.layers.13.mlp.experts.90.down_proj", "model.layers.13.mlp.experts.91.down_proj", "model.layers.13.mlp.experts.92.down_proj", "model.layers.13.mlp.experts.93.down_proj", "model.layers.13.mlp.experts.94.down_proj", "model.layers.13.mlp.experts.95.down_proj", "model.layers.13.mlp.experts.96.down_proj", "model.layers.13.mlp.experts.97.down_proj", "model.layers.13.mlp.experts.98.down_proj", "model.layers.13.mlp.experts.99.down_proj", "model.layers.13.mlp.experts.100.down_proj", "model.layers.13.mlp.experts.101.down_proj", "model.layers.13.mlp.experts.102.down_proj", "model.layers.13.mlp.experts.103.down_proj", "model.layers.13.mlp.experts.104.down_proj", "model.layers.13.mlp.experts.105.down_proj", "model.layers.13.mlp.experts.106.down_proj", "model.layers.13.mlp.experts.107.down_proj", "model.layers.13.mlp.experts.108.down_proj", "model.layers.13.mlp.experts.109.down_proj", "model.layers.13.mlp.experts.110.down_proj", "model.layers.13.mlp.experts.111.down_proj", "model.layers.13.mlp.experts.112.down_proj", "model.layers.13.mlp.experts.113.down_proj", "model.layers.13.mlp.experts.114.down_proj", "model.layers.13.mlp.experts.115.down_proj", "model.layers.13.mlp.experts.116.down_proj", "model.layers.13.mlp.experts.117.down_proj", "model.layers.13.mlp.experts.118.down_proj", "model.layers.13.mlp.experts.119.down_proj", "model.layers.13.mlp.experts.120.down_proj", "model.layers.13.mlp.experts.121.down_proj", "model.layers.13.mlp.experts.122.down_proj", "model.layers.13.mlp.experts.123.down_proj", "model.layers.13.mlp.experts.124.down_proj", "model.layers.13.mlp.experts.125.down_proj", "model.layers.13.mlp.experts.126.down_proj", "model.layers.13.mlp.experts.127.down_proj", "model.layers.13.mlp.experts.128.down_proj", "model.layers.13.mlp.experts.129.down_proj", "model.layers.13.mlp.experts.130.down_proj", "model.layers.13.mlp.experts.131.down_proj", "model.layers.13.mlp.experts.132.down_proj", "model.layers.13.mlp.experts.133.down_proj", "model.layers.13.mlp.experts.134.down_proj", "model.layers.13.mlp.experts.135.down_proj", "model.layers.13.mlp.experts.136.down_proj", "model.layers.13.mlp.experts.137.down_proj", "model.layers.13.mlp.experts.138.down_proj", "model.layers.13.mlp.experts.139.down_proj", "model.layers.13.mlp.experts.140.down_proj", "model.layers.13.mlp.experts.141.down_proj", "model.layers.13.mlp.experts.142.down_proj", "model.layers.13.mlp.experts.143.down_proj", "model.layers.13.mlp.experts.144.down_proj", "model.layers.13.mlp.experts.145.down_proj", "model.layers.13.mlp.experts.146.down_proj", "model.layers.13.mlp.experts.147.down_proj", "model.layers.13.mlp.experts.148.down_proj", "model.layers.13.mlp.experts.149.down_proj", "model.layers.13.mlp.experts.150.down_proj", "model.layers.13.mlp.experts.151.down_proj", "model.layers.13.mlp.experts.152.down_proj", "model.layers.13.mlp.experts.153.down_proj", "model.layers.13.mlp.experts.154.down_proj", "model.layers.13.mlp.experts.155.down_proj", "model.layers.13.mlp.experts.156.down_proj", "model.layers.13.mlp.experts.157.down_proj", "model.layers.13.mlp.experts.158.down_proj", "model.layers.13.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -0.00013361414894461597, "dbits": 1258291200 }, { "dkld": -0.00017687415238469735, "dbits": 2516582400 } ] }, { "idx": 81, "layers": [ "model.layers.14.self_attn.q_proj" ], "candidates": [ { "dkld": 1.8151570111514526e-05, "dbits": 62914560 }, { "dkld": -2.84439185634245e-05, "dbits": 125829120 } ] }, { "idx": 82, "layers": [ "model.layers.14.self_attn.k_proj", "model.layers.14.self_attn.v_proj" ], "candidates": [ { "dkld": 0.00011145723983645509, "dbits": 10485760 }, { "dkld": 0.00010484959930181538, "dbits": 20971520 } ] }, { "idx": 83, "layers": [ "model.layers.14.self_attn.o_proj" ], "candidates": [ { "dkld": -0.0002401652978733168, "dbits": 62914560 }, { "dkld": -0.00022975404281169037, "dbits": 125829120 } ] }, { "idx": 84, "layers": [ "model.layers.14.mlp.shared_experts.gate_proj", "model.layers.14.mlp.shared_experts.up_proj", "model.layers.14.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.0504772439599037e-05, "dbits": 23592960 }, { "dkld": -3.840955905616214e-05, "dbits": 47185920 } ] }, { "idx": 85, "layers": [ "model.layers.14.mlp.experts.0.gate_proj", "model.layers.14.mlp.experts.1.gate_proj", "model.layers.14.mlp.experts.2.gate_proj", "model.layers.14.mlp.experts.3.gate_proj", "model.layers.14.mlp.experts.4.gate_proj", "model.layers.14.mlp.experts.5.gate_proj", "model.layers.14.mlp.experts.6.gate_proj", "model.layers.14.mlp.experts.7.gate_proj", "model.layers.14.mlp.experts.8.gate_proj", "model.layers.14.mlp.experts.9.gate_proj", "model.layers.14.mlp.experts.10.gate_proj", "model.layers.14.mlp.experts.11.gate_proj", "model.layers.14.mlp.experts.12.gate_proj", "model.layers.14.mlp.experts.13.gate_proj", "model.layers.14.mlp.experts.14.gate_proj", "model.layers.14.mlp.experts.15.gate_proj", "model.layers.14.mlp.experts.16.gate_proj", "model.layers.14.mlp.experts.17.gate_proj", "model.layers.14.mlp.experts.18.gate_proj", "model.layers.14.mlp.experts.19.gate_proj", "model.layers.14.mlp.experts.20.gate_proj", "model.layers.14.mlp.experts.21.gate_proj", "model.layers.14.mlp.experts.22.gate_proj", "model.layers.14.mlp.experts.23.gate_proj", "model.layers.14.mlp.experts.24.gate_proj", "model.layers.14.mlp.experts.25.gate_proj", "model.layers.14.mlp.experts.26.gate_proj", "model.layers.14.mlp.experts.27.gate_proj", "model.layers.14.mlp.experts.28.gate_proj", "model.layers.14.mlp.experts.29.gate_proj", "model.layers.14.mlp.experts.30.gate_proj", "model.layers.14.mlp.experts.31.gate_proj", "model.layers.14.mlp.experts.32.gate_proj", "model.layers.14.mlp.experts.33.gate_proj", "model.layers.14.mlp.experts.34.gate_proj", "model.layers.14.mlp.experts.35.gate_proj", "model.layers.14.mlp.experts.36.gate_proj", "model.layers.14.mlp.experts.37.gate_proj", "model.layers.14.mlp.experts.38.gate_proj", "model.layers.14.mlp.experts.39.gate_proj", "model.layers.14.mlp.experts.40.gate_proj", "model.layers.14.mlp.experts.41.gate_proj", "model.layers.14.mlp.experts.42.gate_proj", "model.layers.14.mlp.experts.43.gate_proj", "model.layers.14.mlp.experts.44.gate_proj", "model.layers.14.mlp.experts.45.gate_proj", "model.layers.14.mlp.experts.46.gate_proj", "model.layers.14.mlp.experts.47.gate_proj", "model.layers.14.mlp.experts.48.gate_proj", "model.layers.14.mlp.experts.49.gate_proj", "model.layers.14.mlp.experts.50.gate_proj", "model.layers.14.mlp.experts.51.gate_proj", "model.layers.14.mlp.experts.52.gate_proj", "model.layers.14.mlp.experts.53.gate_proj", "model.layers.14.mlp.experts.54.gate_proj", "model.layers.14.mlp.experts.55.gate_proj", "model.layers.14.mlp.experts.56.gate_proj", "model.layers.14.mlp.experts.57.gate_proj", "model.layers.14.mlp.experts.58.gate_proj", "model.layers.14.mlp.experts.59.gate_proj", "model.layers.14.mlp.experts.60.gate_proj", "model.layers.14.mlp.experts.61.gate_proj", "model.layers.14.mlp.experts.62.gate_proj", "model.layers.14.mlp.experts.63.gate_proj", "model.layers.14.mlp.experts.64.gate_proj", "model.layers.14.mlp.experts.65.gate_proj", "model.layers.14.mlp.experts.66.gate_proj", "model.layers.14.mlp.experts.67.gate_proj", "model.layers.14.mlp.experts.68.gate_proj", "model.layers.14.mlp.experts.69.gate_proj", "model.layers.14.mlp.experts.70.gate_proj", "model.layers.14.mlp.experts.71.gate_proj", "model.layers.14.mlp.experts.72.gate_proj", "model.layers.14.mlp.experts.73.gate_proj", "model.layers.14.mlp.experts.74.gate_proj", "model.layers.14.mlp.experts.75.gate_proj", "model.layers.14.mlp.experts.76.gate_proj", "model.layers.14.mlp.experts.77.gate_proj", "model.layers.14.mlp.experts.78.gate_proj", "model.layers.14.mlp.experts.79.gate_proj", "model.layers.14.mlp.experts.80.gate_proj", "model.layers.14.mlp.experts.81.gate_proj", "model.layers.14.mlp.experts.82.gate_proj", "model.layers.14.mlp.experts.83.gate_proj", "model.layers.14.mlp.experts.84.gate_proj", "model.layers.14.mlp.experts.85.gate_proj", "model.layers.14.mlp.experts.86.gate_proj", "model.layers.14.mlp.experts.87.gate_proj", "model.layers.14.mlp.experts.88.gate_proj", "model.layers.14.mlp.experts.89.gate_proj", "model.layers.14.mlp.experts.90.gate_proj", "model.layers.14.mlp.experts.91.gate_proj", "model.layers.14.mlp.experts.92.gate_proj", "model.layers.14.mlp.experts.93.gate_proj", "model.layers.14.mlp.experts.94.gate_proj", "model.layers.14.mlp.experts.95.gate_proj", "model.layers.14.mlp.experts.96.gate_proj", "model.layers.14.mlp.experts.97.gate_proj", "model.layers.14.mlp.experts.98.gate_proj", "model.layers.14.mlp.experts.99.gate_proj", "model.layers.14.mlp.experts.100.gate_proj", "model.layers.14.mlp.experts.101.gate_proj", "model.layers.14.mlp.experts.102.gate_proj", "model.layers.14.mlp.experts.103.gate_proj", "model.layers.14.mlp.experts.104.gate_proj", "model.layers.14.mlp.experts.105.gate_proj", "model.layers.14.mlp.experts.106.gate_proj", "model.layers.14.mlp.experts.107.gate_proj", "model.layers.14.mlp.experts.108.gate_proj", "model.layers.14.mlp.experts.109.gate_proj", "model.layers.14.mlp.experts.110.gate_proj", "model.layers.14.mlp.experts.111.gate_proj", "model.layers.14.mlp.experts.112.gate_proj", "model.layers.14.mlp.experts.113.gate_proj", "model.layers.14.mlp.experts.114.gate_proj", "model.layers.14.mlp.experts.115.gate_proj", "model.layers.14.mlp.experts.116.gate_proj", "model.layers.14.mlp.experts.117.gate_proj", "model.layers.14.mlp.experts.118.gate_proj", "model.layers.14.mlp.experts.119.gate_proj", "model.layers.14.mlp.experts.120.gate_proj", "model.layers.14.mlp.experts.121.gate_proj", "model.layers.14.mlp.experts.122.gate_proj", "model.layers.14.mlp.experts.123.gate_proj", "model.layers.14.mlp.experts.124.gate_proj", "model.layers.14.mlp.experts.125.gate_proj", "model.layers.14.mlp.experts.126.gate_proj", "model.layers.14.mlp.experts.127.gate_proj", "model.layers.14.mlp.experts.128.gate_proj", "model.layers.14.mlp.experts.129.gate_proj", "model.layers.14.mlp.experts.130.gate_proj", "model.layers.14.mlp.experts.131.gate_proj", "model.layers.14.mlp.experts.132.gate_proj", "model.layers.14.mlp.experts.133.gate_proj", "model.layers.14.mlp.experts.134.gate_proj", "model.layers.14.mlp.experts.135.gate_proj", "model.layers.14.mlp.experts.136.gate_proj", "model.layers.14.mlp.experts.137.gate_proj", "model.layers.14.mlp.experts.138.gate_proj", "model.layers.14.mlp.experts.139.gate_proj", "model.layers.14.mlp.experts.140.gate_proj", "model.layers.14.mlp.experts.141.gate_proj", "model.layers.14.mlp.experts.142.gate_proj", "model.layers.14.mlp.experts.143.gate_proj", "model.layers.14.mlp.experts.144.gate_proj", "model.layers.14.mlp.experts.145.gate_proj", "model.layers.14.mlp.experts.146.gate_proj", "model.layers.14.mlp.experts.147.gate_proj", "model.layers.14.mlp.experts.148.gate_proj", "model.layers.14.mlp.experts.149.gate_proj", "model.layers.14.mlp.experts.150.gate_proj", "model.layers.14.mlp.experts.151.gate_proj", "model.layers.14.mlp.experts.152.gate_proj", "model.layers.14.mlp.experts.153.gate_proj", "model.layers.14.mlp.experts.154.gate_proj", "model.layers.14.mlp.experts.155.gate_proj", "model.layers.14.mlp.experts.156.gate_proj", "model.layers.14.mlp.experts.157.gate_proj", "model.layers.14.mlp.experts.158.gate_proj", "model.layers.14.mlp.experts.159.gate_proj", "model.layers.14.mlp.experts.0.up_proj", "model.layers.14.mlp.experts.1.up_proj", "model.layers.14.mlp.experts.2.up_proj", "model.layers.14.mlp.experts.3.up_proj", "model.layers.14.mlp.experts.4.up_proj", "model.layers.14.mlp.experts.5.up_proj", "model.layers.14.mlp.experts.6.up_proj", "model.layers.14.mlp.experts.7.up_proj", "model.layers.14.mlp.experts.8.up_proj", "model.layers.14.mlp.experts.9.up_proj", "model.layers.14.mlp.experts.10.up_proj", "model.layers.14.mlp.experts.11.up_proj", "model.layers.14.mlp.experts.12.up_proj", "model.layers.14.mlp.experts.13.up_proj", "model.layers.14.mlp.experts.14.up_proj", "model.layers.14.mlp.experts.15.up_proj", "model.layers.14.mlp.experts.16.up_proj", "model.layers.14.mlp.experts.17.up_proj", "model.layers.14.mlp.experts.18.up_proj", "model.layers.14.mlp.experts.19.up_proj", "model.layers.14.mlp.experts.20.up_proj", "model.layers.14.mlp.experts.21.up_proj", "model.layers.14.mlp.experts.22.up_proj", "model.layers.14.mlp.experts.23.up_proj", "model.layers.14.mlp.experts.24.up_proj", "model.layers.14.mlp.experts.25.up_proj", "model.layers.14.mlp.experts.26.up_proj", "model.layers.14.mlp.experts.27.up_proj", "model.layers.14.mlp.experts.28.up_proj", "model.layers.14.mlp.experts.29.up_proj", "model.layers.14.mlp.experts.30.up_proj", "model.layers.14.mlp.experts.31.up_proj", "model.layers.14.mlp.experts.32.up_proj", "model.layers.14.mlp.experts.33.up_proj", "model.layers.14.mlp.experts.34.up_proj", "model.layers.14.mlp.experts.35.up_proj", "model.layers.14.mlp.experts.36.up_proj", "model.layers.14.mlp.experts.37.up_proj", "model.layers.14.mlp.experts.38.up_proj", "model.layers.14.mlp.experts.39.up_proj", "model.layers.14.mlp.experts.40.up_proj", "model.layers.14.mlp.experts.41.up_proj", "model.layers.14.mlp.experts.42.up_proj", "model.layers.14.mlp.experts.43.up_proj", "model.layers.14.mlp.experts.44.up_proj", "model.layers.14.mlp.experts.45.up_proj", "model.layers.14.mlp.experts.46.up_proj", "model.layers.14.mlp.experts.47.up_proj", "model.layers.14.mlp.experts.48.up_proj", "model.layers.14.mlp.experts.49.up_proj", "model.layers.14.mlp.experts.50.up_proj", "model.layers.14.mlp.experts.51.up_proj", "model.layers.14.mlp.experts.52.up_proj", "model.layers.14.mlp.experts.53.up_proj", "model.layers.14.mlp.experts.54.up_proj", "model.layers.14.mlp.experts.55.up_proj", "model.layers.14.mlp.experts.56.up_proj", "model.layers.14.mlp.experts.57.up_proj", "model.layers.14.mlp.experts.58.up_proj", "model.layers.14.mlp.experts.59.up_proj", "model.layers.14.mlp.experts.60.up_proj", "model.layers.14.mlp.experts.61.up_proj", "model.layers.14.mlp.experts.62.up_proj", "model.layers.14.mlp.experts.63.up_proj", "model.layers.14.mlp.experts.64.up_proj", "model.layers.14.mlp.experts.65.up_proj", "model.layers.14.mlp.experts.66.up_proj", "model.layers.14.mlp.experts.67.up_proj", "model.layers.14.mlp.experts.68.up_proj", "model.layers.14.mlp.experts.69.up_proj", "model.layers.14.mlp.experts.70.up_proj", "model.layers.14.mlp.experts.71.up_proj", "model.layers.14.mlp.experts.72.up_proj", "model.layers.14.mlp.experts.73.up_proj", "model.layers.14.mlp.experts.74.up_proj", "model.layers.14.mlp.experts.75.up_proj", "model.layers.14.mlp.experts.76.up_proj", "model.layers.14.mlp.experts.77.up_proj", "model.layers.14.mlp.experts.78.up_proj", "model.layers.14.mlp.experts.79.up_proj", "model.layers.14.mlp.experts.80.up_proj", "model.layers.14.mlp.experts.81.up_proj", "model.layers.14.mlp.experts.82.up_proj", "model.layers.14.mlp.experts.83.up_proj", "model.layers.14.mlp.experts.84.up_proj", "model.layers.14.mlp.experts.85.up_proj", "model.layers.14.mlp.experts.86.up_proj", "model.layers.14.mlp.experts.87.up_proj", "model.layers.14.mlp.experts.88.up_proj", "model.layers.14.mlp.experts.89.up_proj", "model.layers.14.mlp.experts.90.up_proj", "model.layers.14.mlp.experts.91.up_proj", "model.layers.14.mlp.experts.92.up_proj", "model.layers.14.mlp.experts.93.up_proj", "model.layers.14.mlp.experts.94.up_proj", "model.layers.14.mlp.experts.95.up_proj", "model.layers.14.mlp.experts.96.up_proj", "model.layers.14.mlp.experts.97.up_proj", "model.layers.14.mlp.experts.98.up_proj", "model.layers.14.mlp.experts.99.up_proj", "model.layers.14.mlp.experts.100.up_proj", "model.layers.14.mlp.experts.101.up_proj", "model.layers.14.mlp.experts.102.up_proj", "model.layers.14.mlp.experts.103.up_proj", "model.layers.14.mlp.experts.104.up_proj", "model.layers.14.mlp.experts.105.up_proj", "model.layers.14.mlp.experts.106.up_proj", "model.layers.14.mlp.experts.107.up_proj", "model.layers.14.mlp.experts.108.up_proj", "model.layers.14.mlp.experts.109.up_proj", "model.layers.14.mlp.experts.110.up_proj", "model.layers.14.mlp.experts.111.up_proj", "model.layers.14.mlp.experts.112.up_proj", "model.layers.14.mlp.experts.113.up_proj", "model.layers.14.mlp.experts.114.up_proj", "model.layers.14.mlp.experts.115.up_proj", "model.layers.14.mlp.experts.116.up_proj", "model.layers.14.mlp.experts.117.up_proj", "model.layers.14.mlp.experts.118.up_proj", "model.layers.14.mlp.experts.119.up_proj", "model.layers.14.mlp.experts.120.up_proj", "model.layers.14.mlp.experts.121.up_proj", "model.layers.14.mlp.experts.122.up_proj", "model.layers.14.mlp.experts.123.up_proj", "model.layers.14.mlp.experts.124.up_proj", "model.layers.14.mlp.experts.125.up_proj", "model.layers.14.mlp.experts.126.up_proj", "model.layers.14.mlp.experts.127.up_proj", "model.layers.14.mlp.experts.128.up_proj", "model.layers.14.mlp.experts.129.up_proj", "model.layers.14.mlp.experts.130.up_proj", "model.layers.14.mlp.experts.131.up_proj", "model.layers.14.mlp.experts.132.up_proj", "model.layers.14.mlp.experts.133.up_proj", "model.layers.14.mlp.experts.134.up_proj", "model.layers.14.mlp.experts.135.up_proj", "model.layers.14.mlp.experts.136.up_proj", "model.layers.14.mlp.experts.137.up_proj", "model.layers.14.mlp.experts.138.up_proj", "model.layers.14.mlp.experts.139.up_proj", "model.layers.14.mlp.experts.140.up_proj", "model.layers.14.mlp.experts.141.up_proj", "model.layers.14.mlp.experts.142.up_proj", "model.layers.14.mlp.experts.143.up_proj", "model.layers.14.mlp.experts.144.up_proj", "model.layers.14.mlp.experts.145.up_proj", "model.layers.14.mlp.experts.146.up_proj", "model.layers.14.mlp.experts.147.up_proj", "model.layers.14.mlp.experts.148.up_proj", "model.layers.14.mlp.experts.149.up_proj", "model.layers.14.mlp.experts.150.up_proj", "model.layers.14.mlp.experts.151.up_proj", "model.layers.14.mlp.experts.152.up_proj", "model.layers.14.mlp.experts.153.up_proj", "model.layers.14.mlp.experts.154.up_proj", "model.layers.14.mlp.experts.155.up_proj", "model.layers.14.mlp.experts.156.up_proj", "model.layers.14.mlp.experts.157.up_proj", "model.layers.14.mlp.experts.158.up_proj", "model.layers.14.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.797133971005574e-05, "dbits": 2516582400 }, { "dkld": -0.00010491660796105827, "dbits": 5033164800 } ] }, { "idx": 86, "layers": [ "model.layers.14.mlp.experts.0.down_proj", "model.layers.14.mlp.experts.1.down_proj", "model.layers.14.mlp.experts.2.down_proj", "model.layers.14.mlp.experts.3.down_proj", "model.layers.14.mlp.experts.4.down_proj", "model.layers.14.mlp.experts.5.down_proj", "model.layers.14.mlp.experts.6.down_proj", "model.layers.14.mlp.experts.7.down_proj", "model.layers.14.mlp.experts.8.down_proj", "model.layers.14.mlp.experts.9.down_proj", "model.layers.14.mlp.experts.10.down_proj", "model.layers.14.mlp.experts.11.down_proj", "model.layers.14.mlp.experts.12.down_proj", "model.layers.14.mlp.experts.13.down_proj", "model.layers.14.mlp.experts.14.down_proj", "model.layers.14.mlp.experts.15.down_proj", "model.layers.14.mlp.experts.16.down_proj", "model.layers.14.mlp.experts.17.down_proj", "model.layers.14.mlp.experts.18.down_proj", "model.layers.14.mlp.experts.19.down_proj", "model.layers.14.mlp.experts.20.down_proj", "model.layers.14.mlp.experts.21.down_proj", "model.layers.14.mlp.experts.22.down_proj", "model.layers.14.mlp.experts.23.down_proj", "model.layers.14.mlp.experts.24.down_proj", "model.layers.14.mlp.experts.25.down_proj", "model.layers.14.mlp.experts.26.down_proj", "model.layers.14.mlp.experts.27.down_proj", "model.layers.14.mlp.experts.28.down_proj", "model.layers.14.mlp.experts.29.down_proj", "model.layers.14.mlp.experts.30.down_proj", "model.layers.14.mlp.experts.31.down_proj", "model.layers.14.mlp.experts.32.down_proj", "model.layers.14.mlp.experts.33.down_proj", "model.layers.14.mlp.experts.34.down_proj", "model.layers.14.mlp.experts.35.down_proj", "model.layers.14.mlp.experts.36.down_proj", "model.layers.14.mlp.experts.37.down_proj", "model.layers.14.mlp.experts.38.down_proj", "model.layers.14.mlp.experts.39.down_proj", "model.layers.14.mlp.experts.40.down_proj", "model.layers.14.mlp.experts.41.down_proj", "model.layers.14.mlp.experts.42.down_proj", "model.layers.14.mlp.experts.43.down_proj", "model.layers.14.mlp.experts.44.down_proj", "model.layers.14.mlp.experts.45.down_proj", "model.layers.14.mlp.experts.46.down_proj", "model.layers.14.mlp.experts.47.down_proj", "model.layers.14.mlp.experts.48.down_proj", "model.layers.14.mlp.experts.49.down_proj", "model.layers.14.mlp.experts.50.down_proj", "model.layers.14.mlp.experts.51.down_proj", "model.layers.14.mlp.experts.52.down_proj", "model.layers.14.mlp.experts.53.down_proj", "model.layers.14.mlp.experts.54.down_proj", "model.layers.14.mlp.experts.55.down_proj", "model.layers.14.mlp.experts.56.down_proj", "model.layers.14.mlp.experts.57.down_proj", "model.layers.14.mlp.experts.58.down_proj", "model.layers.14.mlp.experts.59.down_proj", "model.layers.14.mlp.experts.60.down_proj", "model.layers.14.mlp.experts.61.down_proj", "model.layers.14.mlp.experts.62.down_proj", "model.layers.14.mlp.experts.63.down_proj", "model.layers.14.mlp.experts.64.down_proj", "model.layers.14.mlp.experts.65.down_proj", "model.layers.14.mlp.experts.66.down_proj", "model.layers.14.mlp.experts.67.down_proj", "model.layers.14.mlp.experts.68.down_proj", "model.layers.14.mlp.experts.69.down_proj", "model.layers.14.mlp.experts.70.down_proj", "model.layers.14.mlp.experts.71.down_proj", "model.layers.14.mlp.experts.72.down_proj", "model.layers.14.mlp.experts.73.down_proj", "model.layers.14.mlp.experts.74.down_proj", "model.layers.14.mlp.experts.75.down_proj", "model.layers.14.mlp.experts.76.down_proj", "model.layers.14.mlp.experts.77.down_proj", "model.layers.14.mlp.experts.78.down_proj", "model.layers.14.mlp.experts.79.down_proj", "model.layers.14.mlp.experts.80.down_proj", "model.layers.14.mlp.experts.81.down_proj", "model.layers.14.mlp.experts.82.down_proj", "model.layers.14.mlp.experts.83.down_proj", "model.layers.14.mlp.experts.84.down_proj", "model.layers.14.mlp.experts.85.down_proj", "model.layers.14.mlp.experts.86.down_proj", "model.layers.14.mlp.experts.87.down_proj", "model.layers.14.mlp.experts.88.down_proj", "model.layers.14.mlp.experts.89.down_proj", "model.layers.14.mlp.experts.90.down_proj", "model.layers.14.mlp.experts.91.down_proj", "model.layers.14.mlp.experts.92.down_proj", "model.layers.14.mlp.experts.93.down_proj", "model.layers.14.mlp.experts.94.down_proj", "model.layers.14.mlp.experts.95.down_proj", "model.layers.14.mlp.experts.96.down_proj", "model.layers.14.mlp.experts.97.down_proj", "model.layers.14.mlp.experts.98.down_proj", "model.layers.14.mlp.experts.99.down_proj", "model.layers.14.mlp.experts.100.down_proj", "model.layers.14.mlp.experts.101.down_proj", "model.layers.14.mlp.experts.102.down_proj", "model.layers.14.mlp.experts.103.down_proj", "model.layers.14.mlp.experts.104.down_proj", "model.layers.14.mlp.experts.105.down_proj", "model.layers.14.mlp.experts.106.down_proj", "model.layers.14.mlp.experts.107.down_proj", "model.layers.14.mlp.experts.108.down_proj", "model.layers.14.mlp.experts.109.down_proj", "model.layers.14.mlp.experts.110.down_proj", "model.layers.14.mlp.experts.111.down_proj", "model.layers.14.mlp.experts.112.down_proj", "model.layers.14.mlp.experts.113.down_proj", "model.layers.14.mlp.experts.114.down_proj", "model.layers.14.mlp.experts.115.down_proj", "model.layers.14.mlp.experts.116.down_proj", "model.layers.14.mlp.experts.117.down_proj", "model.layers.14.mlp.experts.118.down_proj", "model.layers.14.mlp.experts.119.down_proj", "model.layers.14.mlp.experts.120.down_proj", "model.layers.14.mlp.experts.121.down_proj", "model.layers.14.mlp.experts.122.down_proj", "model.layers.14.mlp.experts.123.down_proj", "model.layers.14.mlp.experts.124.down_proj", "model.layers.14.mlp.experts.125.down_proj", "model.layers.14.mlp.experts.126.down_proj", "model.layers.14.mlp.experts.127.down_proj", "model.layers.14.mlp.experts.128.down_proj", "model.layers.14.mlp.experts.129.down_proj", "model.layers.14.mlp.experts.130.down_proj", "model.layers.14.mlp.experts.131.down_proj", "model.layers.14.mlp.experts.132.down_proj", "model.layers.14.mlp.experts.133.down_proj", "model.layers.14.mlp.experts.134.down_proj", "model.layers.14.mlp.experts.135.down_proj", "model.layers.14.mlp.experts.136.down_proj", "model.layers.14.mlp.experts.137.down_proj", "model.layers.14.mlp.experts.138.down_proj", "model.layers.14.mlp.experts.139.down_proj", "model.layers.14.mlp.experts.140.down_proj", "model.layers.14.mlp.experts.141.down_proj", "model.layers.14.mlp.experts.142.down_proj", "model.layers.14.mlp.experts.143.down_proj", "model.layers.14.mlp.experts.144.down_proj", "model.layers.14.mlp.experts.145.down_proj", "model.layers.14.mlp.experts.146.down_proj", "model.layers.14.mlp.experts.147.down_proj", "model.layers.14.mlp.experts.148.down_proj", "model.layers.14.mlp.experts.149.down_proj", "model.layers.14.mlp.experts.150.down_proj", "model.layers.14.mlp.experts.151.down_proj", "model.layers.14.mlp.experts.152.down_proj", "model.layers.14.mlp.experts.153.down_proj", "model.layers.14.mlp.experts.154.down_proj", "model.layers.14.mlp.experts.155.down_proj", "model.layers.14.mlp.experts.156.down_proj", "model.layers.14.mlp.experts.157.down_proj", "model.layers.14.mlp.experts.158.down_proj", "model.layers.14.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -9.803595021366969e-05, "dbits": 1258291200 }, { "dkld": -0.00013570180162787368, "dbits": 2516582400 } ] }, { "idx": 87, "layers": [ "model.layers.15.self_attn.q_proj" ], "candidates": [ { "dkld": -6.956048309789131e-07, "dbits": 62914560 }, { "dkld": -1.7254147678613663e-05, "dbits": 125829120 } ] }, { "idx": 88, "layers": [ "model.layers.15.self_attn.k_proj", "model.layers.15.self_attn.v_proj" ], "candidates": [ { "dkld": -8.71689058840261e-05, "dbits": 10485760 }, { "dkld": -6.50487374514331e-05, "dbits": 20971520 } ] }, { "idx": 89, "layers": [ "model.layers.15.self_attn.o_proj" ], "candidates": [ { "dkld": -6.494808476418222e-05, "dbits": 62914560 }, { "dkld": -0.00012208353728055885, "dbits": 125829120 } ] }, { "idx": 90, "layers": [ "model.layers.15.mlp.shared_experts.gate_proj", "model.layers.15.mlp.shared_experts.up_proj", "model.layers.15.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.1168862693011414e-05, "dbits": 23592960 }, { "dkld": -1.5342002734541546e-05, "dbits": 47185920 } ] }, { "idx": 91, "layers": [ "model.layers.15.mlp.experts.0.gate_proj", "model.layers.15.mlp.experts.1.gate_proj", "model.layers.15.mlp.experts.2.gate_proj", "model.layers.15.mlp.experts.3.gate_proj", "model.layers.15.mlp.experts.4.gate_proj", "model.layers.15.mlp.experts.5.gate_proj", "model.layers.15.mlp.experts.6.gate_proj", "model.layers.15.mlp.experts.7.gate_proj", "model.layers.15.mlp.experts.8.gate_proj", "model.layers.15.mlp.experts.9.gate_proj", "model.layers.15.mlp.experts.10.gate_proj", "model.layers.15.mlp.experts.11.gate_proj", "model.layers.15.mlp.experts.12.gate_proj", "model.layers.15.mlp.experts.13.gate_proj", "model.layers.15.mlp.experts.14.gate_proj", "model.layers.15.mlp.experts.15.gate_proj", "model.layers.15.mlp.experts.16.gate_proj", "model.layers.15.mlp.experts.17.gate_proj", "model.layers.15.mlp.experts.18.gate_proj", "model.layers.15.mlp.experts.19.gate_proj", "model.layers.15.mlp.experts.20.gate_proj", "model.layers.15.mlp.experts.21.gate_proj", "model.layers.15.mlp.experts.22.gate_proj", "model.layers.15.mlp.experts.23.gate_proj", "model.layers.15.mlp.experts.24.gate_proj", "model.layers.15.mlp.experts.25.gate_proj", "model.layers.15.mlp.experts.26.gate_proj", "model.layers.15.mlp.experts.27.gate_proj", "model.layers.15.mlp.experts.28.gate_proj", "model.layers.15.mlp.experts.29.gate_proj", "model.layers.15.mlp.experts.30.gate_proj", "model.layers.15.mlp.experts.31.gate_proj", "model.layers.15.mlp.experts.32.gate_proj", "model.layers.15.mlp.experts.33.gate_proj", "model.layers.15.mlp.experts.34.gate_proj", "model.layers.15.mlp.experts.35.gate_proj", "model.layers.15.mlp.experts.36.gate_proj", "model.layers.15.mlp.experts.37.gate_proj", "model.layers.15.mlp.experts.38.gate_proj", "model.layers.15.mlp.experts.39.gate_proj", "model.layers.15.mlp.experts.40.gate_proj", "model.layers.15.mlp.experts.41.gate_proj", "model.layers.15.mlp.experts.42.gate_proj", "model.layers.15.mlp.experts.43.gate_proj", "model.layers.15.mlp.experts.44.gate_proj", "model.layers.15.mlp.experts.45.gate_proj", "model.layers.15.mlp.experts.46.gate_proj", "model.layers.15.mlp.experts.47.gate_proj", "model.layers.15.mlp.experts.48.gate_proj", "model.layers.15.mlp.experts.49.gate_proj", "model.layers.15.mlp.experts.50.gate_proj", "model.layers.15.mlp.experts.51.gate_proj", "model.layers.15.mlp.experts.52.gate_proj", "model.layers.15.mlp.experts.53.gate_proj", "model.layers.15.mlp.experts.54.gate_proj", "model.layers.15.mlp.experts.55.gate_proj", "model.layers.15.mlp.experts.56.gate_proj", "model.layers.15.mlp.experts.57.gate_proj", "model.layers.15.mlp.experts.58.gate_proj", "model.layers.15.mlp.experts.59.gate_proj", "model.layers.15.mlp.experts.60.gate_proj", "model.layers.15.mlp.experts.61.gate_proj", "model.layers.15.mlp.experts.62.gate_proj", "model.layers.15.mlp.experts.63.gate_proj", "model.layers.15.mlp.experts.64.gate_proj", "model.layers.15.mlp.experts.65.gate_proj", "model.layers.15.mlp.experts.66.gate_proj", "model.layers.15.mlp.experts.67.gate_proj", "model.layers.15.mlp.experts.68.gate_proj", "model.layers.15.mlp.experts.69.gate_proj", "model.layers.15.mlp.experts.70.gate_proj", "model.layers.15.mlp.experts.71.gate_proj", "model.layers.15.mlp.experts.72.gate_proj", "model.layers.15.mlp.experts.73.gate_proj", "model.layers.15.mlp.experts.74.gate_proj", "model.layers.15.mlp.experts.75.gate_proj", "model.layers.15.mlp.experts.76.gate_proj", "model.layers.15.mlp.experts.77.gate_proj", "model.layers.15.mlp.experts.78.gate_proj", "model.layers.15.mlp.experts.79.gate_proj", "model.layers.15.mlp.experts.80.gate_proj", "model.layers.15.mlp.experts.81.gate_proj", "model.layers.15.mlp.experts.82.gate_proj", "model.layers.15.mlp.experts.83.gate_proj", "model.layers.15.mlp.experts.84.gate_proj", "model.layers.15.mlp.experts.85.gate_proj", "model.layers.15.mlp.experts.86.gate_proj", "model.layers.15.mlp.experts.87.gate_proj", "model.layers.15.mlp.experts.88.gate_proj", "model.layers.15.mlp.experts.89.gate_proj", "model.layers.15.mlp.experts.90.gate_proj", "model.layers.15.mlp.experts.91.gate_proj", "model.layers.15.mlp.experts.92.gate_proj", "model.layers.15.mlp.experts.93.gate_proj", "model.layers.15.mlp.experts.94.gate_proj", "model.layers.15.mlp.experts.95.gate_proj", "model.layers.15.mlp.experts.96.gate_proj", "model.layers.15.mlp.experts.97.gate_proj", "model.layers.15.mlp.experts.98.gate_proj", "model.layers.15.mlp.experts.99.gate_proj", "model.layers.15.mlp.experts.100.gate_proj", "model.layers.15.mlp.experts.101.gate_proj", "model.layers.15.mlp.experts.102.gate_proj", "model.layers.15.mlp.experts.103.gate_proj", "model.layers.15.mlp.experts.104.gate_proj", "model.layers.15.mlp.experts.105.gate_proj", "model.layers.15.mlp.experts.106.gate_proj", "model.layers.15.mlp.experts.107.gate_proj", "model.layers.15.mlp.experts.108.gate_proj", "model.layers.15.mlp.experts.109.gate_proj", "model.layers.15.mlp.experts.110.gate_proj", "model.layers.15.mlp.experts.111.gate_proj", "model.layers.15.mlp.experts.112.gate_proj", "model.layers.15.mlp.experts.113.gate_proj", "model.layers.15.mlp.experts.114.gate_proj", "model.layers.15.mlp.experts.115.gate_proj", "model.layers.15.mlp.experts.116.gate_proj", "model.layers.15.mlp.experts.117.gate_proj", "model.layers.15.mlp.experts.118.gate_proj", "model.layers.15.mlp.experts.119.gate_proj", "model.layers.15.mlp.experts.120.gate_proj", "model.layers.15.mlp.experts.121.gate_proj", "model.layers.15.mlp.experts.122.gate_proj", "model.layers.15.mlp.experts.123.gate_proj", "model.layers.15.mlp.experts.124.gate_proj", "model.layers.15.mlp.experts.125.gate_proj", "model.layers.15.mlp.experts.126.gate_proj", "model.layers.15.mlp.experts.127.gate_proj", "model.layers.15.mlp.experts.128.gate_proj", "model.layers.15.mlp.experts.129.gate_proj", "model.layers.15.mlp.experts.130.gate_proj", "model.layers.15.mlp.experts.131.gate_proj", "model.layers.15.mlp.experts.132.gate_proj", "model.layers.15.mlp.experts.133.gate_proj", "model.layers.15.mlp.experts.134.gate_proj", "model.layers.15.mlp.experts.135.gate_proj", "model.layers.15.mlp.experts.136.gate_proj", "model.layers.15.mlp.experts.137.gate_proj", "model.layers.15.mlp.experts.138.gate_proj", "model.layers.15.mlp.experts.139.gate_proj", "model.layers.15.mlp.experts.140.gate_proj", "model.layers.15.mlp.experts.141.gate_proj", "model.layers.15.mlp.experts.142.gate_proj", "model.layers.15.mlp.experts.143.gate_proj", "model.layers.15.mlp.experts.144.gate_proj", "model.layers.15.mlp.experts.145.gate_proj", "model.layers.15.mlp.experts.146.gate_proj", "model.layers.15.mlp.experts.147.gate_proj", "model.layers.15.mlp.experts.148.gate_proj", "model.layers.15.mlp.experts.149.gate_proj", "model.layers.15.mlp.experts.150.gate_proj", "model.layers.15.mlp.experts.151.gate_proj", "model.layers.15.mlp.experts.152.gate_proj", "model.layers.15.mlp.experts.153.gate_proj", "model.layers.15.mlp.experts.154.gate_proj", "model.layers.15.mlp.experts.155.gate_proj", "model.layers.15.mlp.experts.156.gate_proj", "model.layers.15.mlp.experts.157.gate_proj", "model.layers.15.mlp.experts.158.gate_proj", "model.layers.15.mlp.experts.159.gate_proj", "model.layers.15.mlp.experts.0.up_proj", "model.layers.15.mlp.experts.1.up_proj", "model.layers.15.mlp.experts.2.up_proj", "model.layers.15.mlp.experts.3.up_proj", "model.layers.15.mlp.experts.4.up_proj", "model.layers.15.mlp.experts.5.up_proj", "model.layers.15.mlp.experts.6.up_proj", "model.layers.15.mlp.experts.7.up_proj", "model.layers.15.mlp.experts.8.up_proj", "model.layers.15.mlp.experts.9.up_proj", "model.layers.15.mlp.experts.10.up_proj", "model.layers.15.mlp.experts.11.up_proj", "model.layers.15.mlp.experts.12.up_proj", "model.layers.15.mlp.experts.13.up_proj", "model.layers.15.mlp.experts.14.up_proj", "model.layers.15.mlp.experts.15.up_proj", "model.layers.15.mlp.experts.16.up_proj", "model.layers.15.mlp.experts.17.up_proj", "model.layers.15.mlp.experts.18.up_proj", "model.layers.15.mlp.experts.19.up_proj", "model.layers.15.mlp.experts.20.up_proj", "model.layers.15.mlp.experts.21.up_proj", "model.layers.15.mlp.experts.22.up_proj", "model.layers.15.mlp.experts.23.up_proj", "model.layers.15.mlp.experts.24.up_proj", "model.layers.15.mlp.experts.25.up_proj", "model.layers.15.mlp.experts.26.up_proj", "model.layers.15.mlp.experts.27.up_proj", "model.layers.15.mlp.experts.28.up_proj", "model.layers.15.mlp.experts.29.up_proj", "model.layers.15.mlp.experts.30.up_proj", "model.layers.15.mlp.experts.31.up_proj", "model.layers.15.mlp.experts.32.up_proj", "model.layers.15.mlp.experts.33.up_proj", "model.layers.15.mlp.experts.34.up_proj", "model.layers.15.mlp.experts.35.up_proj", "model.layers.15.mlp.experts.36.up_proj", "model.layers.15.mlp.experts.37.up_proj", "model.layers.15.mlp.experts.38.up_proj", "model.layers.15.mlp.experts.39.up_proj", "model.layers.15.mlp.experts.40.up_proj", "model.layers.15.mlp.experts.41.up_proj", "model.layers.15.mlp.experts.42.up_proj", "model.layers.15.mlp.experts.43.up_proj", "model.layers.15.mlp.experts.44.up_proj", "model.layers.15.mlp.experts.45.up_proj", "model.layers.15.mlp.experts.46.up_proj", "model.layers.15.mlp.experts.47.up_proj", "model.layers.15.mlp.experts.48.up_proj", "model.layers.15.mlp.experts.49.up_proj", "model.layers.15.mlp.experts.50.up_proj", "model.layers.15.mlp.experts.51.up_proj", "model.layers.15.mlp.experts.52.up_proj", "model.layers.15.mlp.experts.53.up_proj", "model.layers.15.mlp.experts.54.up_proj", "model.layers.15.mlp.experts.55.up_proj", "model.layers.15.mlp.experts.56.up_proj", "model.layers.15.mlp.experts.57.up_proj", "model.layers.15.mlp.experts.58.up_proj", "model.layers.15.mlp.experts.59.up_proj", "model.layers.15.mlp.experts.60.up_proj", "model.layers.15.mlp.experts.61.up_proj", "model.layers.15.mlp.experts.62.up_proj", "model.layers.15.mlp.experts.63.up_proj", "model.layers.15.mlp.experts.64.up_proj", "model.layers.15.mlp.experts.65.up_proj", "model.layers.15.mlp.experts.66.up_proj", "model.layers.15.mlp.experts.67.up_proj", "model.layers.15.mlp.experts.68.up_proj", "model.layers.15.mlp.experts.69.up_proj", "model.layers.15.mlp.experts.70.up_proj", "model.layers.15.mlp.experts.71.up_proj", "model.layers.15.mlp.experts.72.up_proj", "model.layers.15.mlp.experts.73.up_proj", "model.layers.15.mlp.experts.74.up_proj", "model.layers.15.mlp.experts.75.up_proj", "model.layers.15.mlp.experts.76.up_proj", "model.layers.15.mlp.experts.77.up_proj", "model.layers.15.mlp.experts.78.up_proj", "model.layers.15.mlp.experts.79.up_proj", "model.layers.15.mlp.experts.80.up_proj", "model.layers.15.mlp.experts.81.up_proj", "model.layers.15.mlp.experts.82.up_proj", "model.layers.15.mlp.experts.83.up_proj", "model.layers.15.mlp.experts.84.up_proj", "model.layers.15.mlp.experts.85.up_proj", "model.layers.15.mlp.experts.86.up_proj", "model.layers.15.mlp.experts.87.up_proj", "model.layers.15.mlp.experts.88.up_proj", "model.layers.15.mlp.experts.89.up_proj", "model.layers.15.mlp.experts.90.up_proj", "model.layers.15.mlp.experts.91.up_proj", "model.layers.15.mlp.experts.92.up_proj", "model.layers.15.mlp.experts.93.up_proj", "model.layers.15.mlp.experts.94.up_proj", "model.layers.15.mlp.experts.95.up_proj", "model.layers.15.mlp.experts.96.up_proj", "model.layers.15.mlp.experts.97.up_proj", "model.layers.15.mlp.experts.98.up_proj", "model.layers.15.mlp.experts.99.up_proj", "model.layers.15.mlp.experts.100.up_proj", "model.layers.15.mlp.experts.101.up_proj", "model.layers.15.mlp.experts.102.up_proj", "model.layers.15.mlp.experts.103.up_proj", "model.layers.15.mlp.experts.104.up_proj", "model.layers.15.mlp.experts.105.up_proj", "model.layers.15.mlp.experts.106.up_proj", "model.layers.15.mlp.experts.107.up_proj", "model.layers.15.mlp.experts.108.up_proj", "model.layers.15.mlp.experts.109.up_proj", "model.layers.15.mlp.experts.110.up_proj", "model.layers.15.mlp.experts.111.up_proj", "model.layers.15.mlp.experts.112.up_proj", "model.layers.15.mlp.experts.113.up_proj", "model.layers.15.mlp.experts.114.up_proj", "model.layers.15.mlp.experts.115.up_proj", "model.layers.15.mlp.experts.116.up_proj", "model.layers.15.mlp.experts.117.up_proj", "model.layers.15.mlp.experts.118.up_proj", "model.layers.15.mlp.experts.119.up_proj", "model.layers.15.mlp.experts.120.up_proj", "model.layers.15.mlp.experts.121.up_proj", "model.layers.15.mlp.experts.122.up_proj", "model.layers.15.mlp.experts.123.up_proj", "model.layers.15.mlp.experts.124.up_proj", "model.layers.15.mlp.experts.125.up_proj", "model.layers.15.mlp.experts.126.up_proj", "model.layers.15.mlp.experts.127.up_proj", "model.layers.15.mlp.experts.128.up_proj", "model.layers.15.mlp.experts.129.up_proj", "model.layers.15.mlp.experts.130.up_proj", "model.layers.15.mlp.experts.131.up_proj", "model.layers.15.mlp.experts.132.up_proj", "model.layers.15.mlp.experts.133.up_proj", "model.layers.15.mlp.experts.134.up_proj", "model.layers.15.mlp.experts.135.up_proj", "model.layers.15.mlp.experts.136.up_proj", "model.layers.15.mlp.experts.137.up_proj", "model.layers.15.mlp.experts.138.up_proj", "model.layers.15.mlp.experts.139.up_proj", "model.layers.15.mlp.experts.140.up_proj", "model.layers.15.mlp.experts.141.up_proj", "model.layers.15.mlp.experts.142.up_proj", "model.layers.15.mlp.experts.143.up_proj", "model.layers.15.mlp.experts.144.up_proj", "model.layers.15.mlp.experts.145.up_proj", "model.layers.15.mlp.experts.146.up_proj", "model.layers.15.mlp.experts.147.up_proj", "model.layers.15.mlp.experts.148.up_proj", "model.layers.15.mlp.experts.149.up_proj", "model.layers.15.mlp.experts.150.up_proj", "model.layers.15.mlp.experts.151.up_proj", "model.layers.15.mlp.experts.152.up_proj", "model.layers.15.mlp.experts.153.up_proj", "model.layers.15.mlp.experts.154.up_proj", "model.layers.15.mlp.experts.155.up_proj", "model.layers.15.mlp.experts.156.up_proj", "model.layers.15.mlp.experts.157.up_proj", "model.layers.15.mlp.experts.158.up_proj", "model.layers.15.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.775254875421177e-06, "dbits": 2516582400 }, { "dkld": -2.6113656349479458e-05, "dbits": 5033164800 } ] }, { "idx": 92, "layers": [ "model.layers.15.mlp.experts.0.down_proj", "model.layers.15.mlp.experts.1.down_proj", "model.layers.15.mlp.experts.2.down_proj", "model.layers.15.mlp.experts.3.down_proj", "model.layers.15.mlp.experts.4.down_proj", "model.layers.15.mlp.experts.5.down_proj", "model.layers.15.mlp.experts.6.down_proj", "model.layers.15.mlp.experts.7.down_proj", "model.layers.15.mlp.experts.8.down_proj", "model.layers.15.mlp.experts.9.down_proj", "model.layers.15.mlp.experts.10.down_proj", "model.layers.15.mlp.experts.11.down_proj", "model.layers.15.mlp.experts.12.down_proj", "model.layers.15.mlp.experts.13.down_proj", "model.layers.15.mlp.experts.14.down_proj", "model.layers.15.mlp.experts.15.down_proj", "model.layers.15.mlp.experts.16.down_proj", "model.layers.15.mlp.experts.17.down_proj", "model.layers.15.mlp.experts.18.down_proj", "model.layers.15.mlp.experts.19.down_proj", "model.layers.15.mlp.experts.20.down_proj", "model.layers.15.mlp.experts.21.down_proj", "model.layers.15.mlp.experts.22.down_proj", "model.layers.15.mlp.experts.23.down_proj", "model.layers.15.mlp.experts.24.down_proj", "model.layers.15.mlp.experts.25.down_proj", "model.layers.15.mlp.experts.26.down_proj", "model.layers.15.mlp.experts.27.down_proj", "model.layers.15.mlp.experts.28.down_proj", "model.layers.15.mlp.experts.29.down_proj", "model.layers.15.mlp.experts.30.down_proj", "model.layers.15.mlp.experts.31.down_proj", "model.layers.15.mlp.experts.32.down_proj", "model.layers.15.mlp.experts.33.down_proj", "model.layers.15.mlp.experts.34.down_proj", "model.layers.15.mlp.experts.35.down_proj", "model.layers.15.mlp.experts.36.down_proj", "model.layers.15.mlp.experts.37.down_proj", "model.layers.15.mlp.experts.38.down_proj", "model.layers.15.mlp.experts.39.down_proj", "model.layers.15.mlp.experts.40.down_proj", "model.layers.15.mlp.experts.41.down_proj", "model.layers.15.mlp.experts.42.down_proj", "model.layers.15.mlp.experts.43.down_proj", "model.layers.15.mlp.experts.44.down_proj", "model.layers.15.mlp.experts.45.down_proj", "model.layers.15.mlp.experts.46.down_proj", "model.layers.15.mlp.experts.47.down_proj", "model.layers.15.mlp.experts.48.down_proj", "model.layers.15.mlp.experts.49.down_proj", "model.layers.15.mlp.experts.50.down_proj", "model.layers.15.mlp.experts.51.down_proj", "model.layers.15.mlp.experts.52.down_proj", "model.layers.15.mlp.experts.53.down_proj", "model.layers.15.mlp.experts.54.down_proj", "model.layers.15.mlp.experts.55.down_proj", "model.layers.15.mlp.experts.56.down_proj", "model.layers.15.mlp.experts.57.down_proj", "model.layers.15.mlp.experts.58.down_proj", "model.layers.15.mlp.experts.59.down_proj", "model.layers.15.mlp.experts.60.down_proj", "model.layers.15.mlp.experts.61.down_proj", "model.layers.15.mlp.experts.62.down_proj", "model.layers.15.mlp.experts.63.down_proj", "model.layers.15.mlp.experts.64.down_proj", "model.layers.15.mlp.experts.65.down_proj", "model.layers.15.mlp.experts.66.down_proj", "model.layers.15.mlp.experts.67.down_proj", "model.layers.15.mlp.experts.68.down_proj", "model.layers.15.mlp.experts.69.down_proj", "model.layers.15.mlp.experts.70.down_proj", "model.layers.15.mlp.experts.71.down_proj", "model.layers.15.mlp.experts.72.down_proj", "model.layers.15.mlp.experts.73.down_proj", "model.layers.15.mlp.experts.74.down_proj", "model.layers.15.mlp.experts.75.down_proj", "model.layers.15.mlp.experts.76.down_proj", "model.layers.15.mlp.experts.77.down_proj", "model.layers.15.mlp.experts.78.down_proj", "model.layers.15.mlp.experts.79.down_proj", "model.layers.15.mlp.experts.80.down_proj", "model.layers.15.mlp.experts.81.down_proj", "model.layers.15.mlp.experts.82.down_proj", "model.layers.15.mlp.experts.83.down_proj", "model.layers.15.mlp.experts.84.down_proj", "model.layers.15.mlp.experts.85.down_proj", "model.layers.15.mlp.experts.86.down_proj", "model.layers.15.mlp.experts.87.down_proj", "model.layers.15.mlp.experts.88.down_proj", "model.layers.15.mlp.experts.89.down_proj", "model.layers.15.mlp.experts.90.down_proj", "model.layers.15.mlp.experts.91.down_proj", "model.layers.15.mlp.experts.92.down_proj", "model.layers.15.mlp.experts.93.down_proj", "model.layers.15.mlp.experts.94.down_proj", "model.layers.15.mlp.experts.95.down_proj", "model.layers.15.mlp.experts.96.down_proj", "model.layers.15.mlp.experts.97.down_proj", "model.layers.15.mlp.experts.98.down_proj", "model.layers.15.mlp.experts.99.down_proj", "model.layers.15.mlp.experts.100.down_proj", "model.layers.15.mlp.experts.101.down_proj", "model.layers.15.mlp.experts.102.down_proj", "model.layers.15.mlp.experts.103.down_proj", "model.layers.15.mlp.experts.104.down_proj", "model.layers.15.mlp.experts.105.down_proj", "model.layers.15.mlp.experts.106.down_proj", "model.layers.15.mlp.experts.107.down_proj", "model.layers.15.mlp.experts.108.down_proj", "model.layers.15.mlp.experts.109.down_proj", "model.layers.15.mlp.experts.110.down_proj", "model.layers.15.mlp.experts.111.down_proj", "model.layers.15.mlp.experts.112.down_proj", "model.layers.15.mlp.experts.113.down_proj", "model.layers.15.mlp.experts.114.down_proj", "model.layers.15.mlp.experts.115.down_proj", "model.layers.15.mlp.experts.116.down_proj", "model.layers.15.mlp.experts.117.down_proj", "model.layers.15.mlp.experts.118.down_proj", "model.layers.15.mlp.experts.119.down_proj", "model.layers.15.mlp.experts.120.down_proj", "model.layers.15.mlp.experts.121.down_proj", "model.layers.15.mlp.experts.122.down_proj", "model.layers.15.mlp.experts.123.down_proj", "model.layers.15.mlp.experts.124.down_proj", "model.layers.15.mlp.experts.125.down_proj", "model.layers.15.mlp.experts.126.down_proj", "model.layers.15.mlp.experts.127.down_proj", "model.layers.15.mlp.experts.128.down_proj", "model.layers.15.mlp.experts.129.down_proj", "model.layers.15.mlp.experts.130.down_proj", "model.layers.15.mlp.experts.131.down_proj", "model.layers.15.mlp.experts.132.down_proj", "model.layers.15.mlp.experts.133.down_proj", "model.layers.15.mlp.experts.134.down_proj", "model.layers.15.mlp.experts.135.down_proj", "model.layers.15.mlp.experts.136.down_proj", "model.layers.15.mlp.experts.137.down_proj", "model.layers.15.mlp.experts.138.down_proj", "model.layers.15.mlp.experts.139.down_proj", "model.layers.15.mlp.experts.140.down_proj", "model.layers.15.mlp.experts.141.down_proj", "model.layers.15.mlp.experts.142.down_proj", "model.layers.15.mlp.experts.143.down_proj", "model.layers.15.mlp.experts.144.down_proj", "model.layers.15.mlp.experts.145.down_proj", "model.layers.15.mlp.experts.146.down_proj", "model.layers.15.mlp.experts.147.down_proj", "model.layers.15.mlp.experts.148.down_proj", "model.layers.15.mlp.experts.149.down_proj", "model.layers.15.mlp.experts.150.down_proj", "model.layers.15.mlp.experts.151.down_proj", "model.layers.15.mlp.experts.152.down_proj", "model.layers.15.mlp.experts.153.down_proj", "model.layers.15.mlp.experts.154.down_proj", "model.layers.15.mlp.experts.155.down_proj", "model.layers.15.mlp.experts.156.down_proj", "model.layers.15.mlp.experts.157.down_proj", "model.layers.15.mlp.experts.158.down_proj", "model.layers.15.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -6.633403245359659e-05, "dbits": 1258291200 }, { "dkld": -5.082911811768974e-05, "dbits": 2516582400 } ] }, { "idx": 93, "layers": [ "model.layers.16.self_attn.q_proj" ], "candidates": [ { "dkld": 4.343045875430246e-05, "dbits": 62914560 }, { "dkld": 6.0856109485030174e-06, "dbits": 125829120 } ] }, { "idx": 94, "layers": [ "model.layers.16.self_attn.k_proj", "model.layers.16.self_attn.v_proj" ], "candidates": [ { "dkld": -2.018010709434713e-05, "dbits": 10485760 }, { "dkld": -3.7035904824733734e-05, "dbits": 20971520 } ] }, { "idx": 95, "layers": [ "model.layers.16.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00015032812952995266, "dbits": 62914560 }, { "dkld": -0.0001175494864583005, "dbits": 125829120 } ] }, { "idx": 96, "layers": [ "model.layers.16.mlp.shared_experts.gate_proj", "model.layers.16.mlp.shared_experts.up_proj", "model.layers.16.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -6.298928055912222e-05, "dbits": 23592960 }, { "dkld": -6.495607085525885e-05, "dbits": 47185920 } ] }, { "idx": 97, "layers": [ "model.layers.16.mlp.experts.0.gate_proj", "model.layers.16.mlp.experts.1.gate_proj", "model.layers.16.mlp.experts.2.gate_proj", "model.layers.16.mlp.experts.3.gate_proj", "model.layers.16.mlp.experts.4.gate_proj", "model.layers.16.mlp.experts.5.gate_proj", "model.layers.16.mlp.experts.6.gate_proj", "model.layers.16.mlp.experts.7.gate_proj", "model.layers.16.mlp.experts.8.gate_proj", "model.layers.16.mlp.experts.9.gate_proj", "model.layers.16.mlp.experts.10.gate_proj", "model.layers.16.mlp.experts.11.gate_proj", "model.layers.16.mlp.experts.12.gate_proj", "model.layers.16.mlp.experts.13.gate_proj", "model.layers.16.mlp.experts.14.gate_proj", "model.layers.16.mlp.experts.15.gate_proj", "model.layers.16.mlp.experts.16.gate_proj", "model.layers.16.mlp.experts.17.gate_proj", "model.layers.16.mlp.experts.18.gate_proj", "model.layers.16.mlp.experts.19.gate_proj", "model.layers.16.mlp.experts.20.gate_proj", "model.layers.16.mlp.experts.21.gate_proj", "model.layers.16.mlp.experts.22.gate_proj", "model.layers.16.mlp.experts.23.gate_proj", "model.layers.16.mlp.experts.24.gate_proj", "model.layers.16.mlp.experts.25.gate_proj", "model.layers.16.mlp.experts.26.gate_proj", "model.layers.16.mlp.experts.27.gate_proj", "model.layers.16.mlp.experts.28.gate_proj", "model.layers.16.mlp.experts.29.gate_proj", "model.layers.16.mlp.experts.30.gate_proj", "model.layers.16.mlp.experts.31.gate_proj", "model.layers.16.mlp.experts.32.gate_proj", "model.layers.16.mlp.experts.33.gate_proj", "model.layers.16.mlp.experts.34.gate_proj", "model.layers.16.mlp.experts.35.gate_proj", "model.layers.16.mlp.experts.36.gate_proj", "model.layers.16.mlp.experts.37.gate_proj", "model.layers.16.mlp.experts.38.gate_proj", "model.layers.16.mlp.experts.39.gate_proj", "model.layers.16.mlp.experts.40.gate_proj", "model.layers.16.mlp.experts.41.gate_proj", "model.layers.16.mlp.experts.42.gate_proj", "model.layers.16.mlp.experts.43.gate_proj", "model.layers.16.mlp.experts.44.gate_proj", "model.layers.16.mlp.experts.45.gate_proj", "model.layers.16.mlp.experts.46.gate_proj", "model.layers.16.mlp.experts.47.gate_proj", "model.layers.16.mlp.experts.48.gate_proj", "model.layers.16.mlp.experts.49.gate_proj", "model.layers.16.mlp.experts.50.gate_proj", "model.layers.16.mlp.experts.51.gate_proj", "model.layers.16.mlp.experts.52.gate_proj", "model.layers.16.mlp.experts.53.gate_proj", "model.layers.16.mlp.experts.54.gate_proj", "model.layers.16.mlp.experts.55.gate_proj", "model.layers.16.mlp.experts.56.gate_proj", "model.layers.16.mlp.experts.57.gate_proj", "model.layers.16.mlp.experts.58.gate_proj", "model.layers.16.mlp.experts.59.gate_proj", "model.layers.16.mlp.experts.60.gate_proj", "model.layers.16.mlp.experts.61.gate_proj", "model.layers.16.mlp.experts.62.gate_proj", "model.layers.16.mlp.experts.63.gate_proj", "model.layers.16.mlp.experts.64.gate_proj", "model.layers.16.mlp.experts.65.gate_proj", "model.layers.16.mlp.experts.66.gate_proj", "model.layers.16.mlp.experts.67.gate_proj", "model.layers.16.mlp.experts.68.gate_proj", "model.layers.16.mlp.experts.69.gate_proj", "model.layers.16.mlp.experts.70.gate_proj", "model.layers.16.mlp.experts.71.gate_proj", "model.layers.16.mlp.experts.72.gate_proj", "model.layers.16.mlp.experts.73.gate_proj", "model.layers.16.mlp.experts.74.gate_proj", "model.layers.16.mlp.experts.75.gate_proj", "model.layers.16.mlp.experts.76.gate_proj", "model.layers.16.mlp.experts.77.gate_proj", "model.layers.16.mlp.experts.78.gate_proj", "model.layers.16.mlp.experts.79.gate_proj", "model.layers.16.mlp.experts.80.gate_proj", "model.layers.16.mlp.experts.81.gate_proj", "model.layers.16.mlp.experts.82.gate_proj", "model.layers.16.mlp.experts.83.gate_proj", "model.layers.16.mlp.experts.84.gate_proj", "model.layers.16.mlp.experts.85.gate_proj", "model.layers.16.mlp.experts.86.gate_proj", "model.layers.16.mlp.experts.87.gate_proj", "model.layers.16.mlp.experts.88.gate_proj", "model.layers.16.mlp.experts.89.gate_proj", "model.layers.16.mlp.experts.90.gate_proj", "model.layers.16.mlp.experts.91.gate_proj", "model.layers.16.mlp.experts.92.gate_proj", "model.layers.16.mlp.experts.93.gate_proj", "model.layers.16.mlp.experts.94.gate_proj", "model.layers.16.mlp.experts.95.gate_proj", "model.layers.16.mlp.experts.96.gate_proj", "model.layers.16.mlp.experts.97.gate_proj", "model.layers.16.mlp.experts.98.gate_proj", "model.layers.16.mlp.experts.99.gate_proj", "model.layers.16.mlp.experts.100.gate_proj", "model.layers.16.mlp.experts.101.gate_proj", "model.layers.16.mlp.experts.102.gate_proj", "model.layers.16.mlp.experts.103.gate_proj", "model.layers.16.mlp.experts.104.gate_proj", "model.layers.16.mlp.experts.105.gate_proj", "model.layers.16.mlp.experts.106.gate_proj", "model.layers.16.mlp.experts.107.gate_proj", "model.layers.16.mlp.experts.108.gate_proj", "model.layers.16.mlp.experts.109.gate_proj", "model.layers.16.mlp.experts.110.gate_proj", "model.layers.16.mlp.experts.111.gate_proj", "model.layers.16.mlp.experts.112.gate_proj", "model.layers.16.mlp.experts.113.gate_proj", "model.layers.16.mlp.experts.114.gate_proj", "model.layers.16.mlp.experts.115.gate_proj", "model.layers.16.mlp.experts.116.gate_proj", "model.layers.16.mlp.experts.117.gate_proj", "model.layers.16.mlp.experts.118.gate_proj", "model.layers.16.mlp.experts.119.gate_proj", "model.layers.16.mlp.experts.120.gate_proj", "model.layers.16.mlp.experts.121.gate_proj", "model.layers.16.mlp.experts.122.gate_proj", "model.layers.16.mlp.experts.123.gate_proj", "model.layers.16.mlp.experts.124.gate_proj", "model.layers.16.mlp.experts.125.gate_proj", "model.layers.16.mlp.experts.126.gate_proj", "model.layers.16.mlp.experts.127.gate_proj", "model.layers.16.mlp.experts.128.gate_proj", "model.layers.16.mlp.experts.129.gate_proj", "model.layers.16.mlp.experts.130.gate_proj", "model.layers.16.mlp.experts.131.gate_proj", "model.layers.16.mlp.experts.132.gate_proj", "model.layers.16.mlp.experts.133.gate_proj", "model.layers.16.mlp.experts.134.gate_proj", "model.layers.16.mlp.experts.135.gate_proj", "model.layers.16.mlp.experts.136.gate_proj", "model.layers.16.mlp.experts.137.gate_proj", "model.layers.16.mlp.experts.138.gate_proj", "model.layers.16.mlp.experts.139.gate_proj", "model.layers.16.mlp.experts.140.gate_proj", "model.layers.16.mlp.experts.141.gate_proj", "model.layers.16.mlp.experts.142.gate_proj", "model.layers.16.mlp.experts.143.gate_proj", "model.layers.16.mlp.experts.144.gate_proj", "model.layers.16.mlp.experts.145.gate_proj", "model.layers.16.mlp.experts.146.gate_proj", "model.layers.16.mlp.experts.147.gate_proj", "model.layers.16.mlp.experts.148.gate_proj", "model.layers.16.mlp.experts.149.gate_proj", "model.layers.16.mlp.experts.150.gate_proj", "model.layers.16.mlp.experts.151.gate_proj", "model.layers.16.mlp.experts.152.gate_proj", "model.layers.16.mlp.experts.153.gate_proj", "model.layers.16.mlp.experts.154.gate_proj", "model.layers.16.mlp.experts.155.gate_proj", "model.layers.16.mlp.experts.156.gate_proj", "model.layers.16.mlp.experts.157.gate_proj", "model.layers.16.mlp.experts.158.gate_proj", "model.layers.16.mlp.experts.159.gate_proj", "model.layers.16.mlp.experts.0.up_proj", "model.layers.16.mlp.experts.1.up_proj", "model.layers.16.mlp.experts.2.up_proj", "model.layers.16.mlp.experts.3.up_proj", "model.layers.16.mlp.experts.4.up_proj", "model.layers.16.mlp.experts.5.up_proj", "model.layers.16.mlp.experts.6.up_proj", "model.layers.16.mlp.experts.7.up_proj", "model.layers.16.mlp.experts.8.up_proj", "model.layers.16.mlp.experts.9.up_proj", "model.layers.16.mlp.experts.10.up_proj", "model.layers.16.mlp.experts.11.up_proj", "model.layers.16.mlp.experts.12.up_proj", "model.layers.16.mlp.experts.13.up_proj", "model.layers.16.mlp.experts.14.up_proj", "model.layers.16.mlp.experts.15.up_proj", "model.layers.16.mlp.experts.16.up_proj", "model.layers.16.mlp.experts.17.up_proj", "model.layers.16.mlp.experts.18.up_proj", "model.layers.16.mlp.experts.19.up_proj", "model.layers.16.mlp.experts.20.up_proj", "model.layers.16.mlp.experts.21.up_proj", "model.layers.16.mlp.experts.22.up_proj", "model.layers.16.mlp.experts.23.up_proj", "model.layers.16.mlp.experts.24.up_proj", "model.layers.16.mlp.experts.25.up_proj", "model.layers.16.mlp.experts.26.up_proj", "model.layers.16.mlp.experts.27.up_proj", "model.layers.16.mlp.experts.28.up_proj", "model.layers.16.mlp.experts.29.up_proj", "model.layers.16.mlp.experts.30.up_proj", "model.layers.16.mlp.experts.31.up_proj", "model.layers.16.mlp.experts.32.up_proj", "model.layers.16.mlp.experts.33.up_proj", "model.layers.16.mlp.experts.34.up_proj", "model.layers.16.mlp.experts.35.up_proj", "model.layers.16.mlp.experts.36.up_proj", "model.layers.16.mlp.experts.37.up_proj", "model.layers.16.mlp.experts.38.up_proj", "model.layers.16.mlp.experts.39.up_proj", "model.layers.16.mlp.experts.40.up_proj", "model.layers.16.mlp.experts.41.up_proj", "model.layers.16.mlp.experts.42.up_proj", "model.layers.16.mlp.experts.43.up_proj", "model.layers.16.mlp.experts.44.up_proj", "model.layers.16.mlp.experts.45.up_proj", "model.layers.16.mlp.experts.46.up_proj", "model.layers.16.mlp.experts.47.up_proj", "model.layers.16.mlp.experts.48.up_proj", "model.layers.16.mlp.experts.49.up_proj", "model.layers.16.mlp.experts.50.up_proj", "model.layers.16.mlp.experts.51.up_proj", "model.layers.16.mlp.experts.52.up_proj", "model.layers.16.mlp.experts.53.up_proj", "model.layers.16.mlp.experts.54.up_proj", "model.layers.16.mlp.experts.55.up_proj", "model.layers.16.mlp.experts.56.up_proj", "model.layers.16.mlp.experts.57.up_proj", "model.layers.16.mlp.experts.58.up_proj", "model.layers.16.mlp.experts.59.up_proj", "model.layers.16.mlp.experts.60.up_proj", "model.layers.16.mlp.experts.61.up_proj", "model.layers.16.mlp.experts.62.up_proj", "model.layers.16.mlp.experts.63.up_proj", "model.layers.16.mlp.experts.64.up_proj", "model.layers.16.mlp.experts.65.up_proj", "model.layers.16.mlp.experts.66.up_proj", "model.layers.16.mlp.experts.67.up_proj", "model.layers.16.mlp.experts.68.up_proj", "model.layers.16.mlp.experts.69.up_proj", "model.layers.16.mlp.experts.70.up_proj", "model.layers.16.mlp.experts.71.up_proj", "model.layers.16.mlp.experts.72.up_proj", "model.layers.16.mlp.experts.73.up_proj", "model.layers.16.mlp.experts.74.up_proj", "model.layers.16.mlp.experts.75.up_proj", "model.layers.16.mlp.experts.76.up_proj", "model.layers.16.mlp.experts.77.up_proj", "model.layers.16.mlp.experts.78.up_proj", "model.layers.16.mlp.experts.79.up_proj", "model.layers.16.mlp.experts.80.up_proj", "model.layers.16.mlp.experts.81.up_proj", "model.layers.16.mlp.experts.82.up_proj", "model.layers.16.mlp.experts.83.up_proj", "model.layers.16.mlp.experts.84.up_proj", "model.layers.16.mlp.experts.85.up_proj", "model.layers.16.mlp.experts.86.up_proj", "model.layers.16.mlp.experts.87.up_proj", "model.layers.16.mlp.experts.88.up_proj", "model.layers.16.mlp.experts.89.up_proj", "model.layers.16.mlp.experts.90.up_proj", "model.layers.16.mlp.experts.91.up_proj", "model.layers.16.mlp.experts.92.up_proj", "model.layers.16.mlp.experts.93.up_proj", "model.layers.16.mlp.experts.94.up_proj", "model.layers.16.mlp.experts.95.up_proj", "model.layers.16.mlp.experts.96.up_proj", "model.layers.16.mlp.experts.97.up_proj", "model.layers.16.mlp.experts.98.up_proj", "model.layers.16.mlp.experts.99.up_proj", "model.layers.16.mlp.experts.100.up_proj", "model.layers.16.mlp.experts.101.up_proj", "model.layers.16.mlp.experts.102.up_proj", "model.layers.16.mlp.experts.103.up_proj", "model.layers.16.mlp.experts.104.up_proj", "model.layers.16.mlp.experts.105.up_proj", "model.layers.16.mlp.experts.106.up_proj", "model.layers.16.mlp.experts.107.up_proj", "model.layers.16.mlp.experts.108.up_proj", "model.layers.16.mlp.experts.109.up_proj", "model.layers.16.mlp.experts.110.up_proj", "model.layers.16.mlp.experts.111.up_proj", "model.layers.16.mlp.experts.112.up_proj", "model.layers.16.mlp.experts.113.up_proj", "model.layers.16.mlp.experts.114.up_proj", "model.layers.16.mlp.experts.115.up_proj", "model.layers.16.mlp.experts.116.up_proj", "model.layers.16.mlp.experts.117.up_proj", "model.layers.16.mlp.experts.118.up_proj", "model.layers.16.mlp.experts.119.up_proj", "model.layers.16.mlp.experts.120.up_proj", "model.layers.16.mlp.experts.121.up_proj", "model.layers.16.mlp.experts.122.up_proj", "model.layers.16.mlp.experts.123.up_proj", "model.layers.16.mlp.experts.124.up_proj", "model.layers.16.mlp.experts.125.up_proj", "model.layers.16.mlp.experts.126.up_proj", "model.layers.16.mlp.experts.127.up_proj", "model.layers.16.mlp.experts.128.up_proj", "model.layers.16.mlp.experts.129.up_proj", "model.layers.16.mlp.experts.130.up_proj", "model.layers.16.mlp.experts.131.up_proj", "model.layers.16.mlp.experts.132.up_proj", "model.layers.16.mlp.experts.133.up_proj", "model.layers.16.mlp.experts.134.up_proj", "model.layers.16.mlp.experts.135.up_proj", "model.layers.16.mlp.experts.136.up_proj", "model.layers.16.mlp.experts.137.up_proj", "model.layers.16.mlp.experts.138.up_proj", "model.layers.16.mlp.experts.139.up_proj", "model.layers.16.mlp.experts.140.up_proj", "model.layers.16.mlp.experts.141.up_proj", "model.layers.16.mlp.experts.142.up_proj", "model.layers.16.mlp.experts.143.up_proj", "model.layers.16.mlp.experts.144.up_proj", "model.layers.16.mlp.experts.145.up_proj", "model.layers.16.mlp.experts.146.up_proj", "model.layers.16.mlp.experts.147.up_proj", "model.layers.16.mlp.experts.148.up_proj", "model.layers.16.mlp.experts.149.up_proj", "model.layers.16.mlp.experts.150.up_proj", "model.layers.16.mlp.experts.151.up_proj", "model.layers.16.mlp.experts.152.up_proj", "model.layers.16.mlp.experts.153.up_proj", "model.layers.16.mlp.experts.154.up_proj", "model.layers.16.mlp.experts.155.up_proj", "model.layers.16.mlp.experts.156.up_proj", "model.layers.16.mlp.experts.157.up_proj", "model.layers.16.mlp.experts.158.up_proj", "model.layers.16.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -0.00018031278159469366, "dbits": 2516582400 }, { "dkld": -0.00019310102798044543, "dbits": 5033164800 } ] }, { "idx": 98, "layers": [ "model.layers.16.mlp.experts.0.down_proj", "model.layers.16.mlp.experts.1.down_proj", "model.layers.16.mlp.experts.2.down_proj", "model.layers.16.mlp.experts.3.down_proj", "model.layers.16.mlp.experts.4.down_proj", "model.layers.16.mlp.experts.5.down_proj", "model.layers.16.mlp.experts.6.down_proj", "model.layers.16.mlp.experts.7.down_proj", "model.layers.16.mlp.experts.8.down_proj", "model.layers.16.mlp.experts.9.down_proj", "model.layers.16.mlp.experts.10.down_proj", "model.layers.16.mlp.experts.11.down_proj", "model.layers.16.mlp.experts.12.down_proj", "model.layers.16.mlp.experts.13.down_proj", "model.layers.16.mlp.experts.14.down_proj", "model.layers.16.mlp.experts.15.down_proj", "model.layers.16.mlp.experts.16.down_proj", "model.layers.16.mlp.experts.17.down_proj", "model.layers.16.mlp.experts.18.down_proj", "model.layers.16.mlp.experts.19.down_proj", "model.layers.16.mlp.experts.20.down_proj", "model.layers.16.mlp.experts.21.down_proj", "model.layers.16.mlp.experts.22.down_proj", "model.layers.16.mlp.experts.23.down_proj", "model.layers.16.mlp.experts.24.down_proj", "model.layers.16.mlp.experts.25.down_proj", "model.layers.16.mlp.experts.26.down_proj", "model.layers.16.mlp.experts.27.down_proj", "model.layers.16.mlp.experts.28.down_proj", "model.layers.16.mlp.experts.29.down_proj", "model.layers.16.mlp.experts.30.down_proj", "model.layers.16.mlp.experts.31.down_proj", "model.layers.16.mlp.experts.32.down_proj", "model.layers.16.mlp.experts.33.down_proj", "model.layers.16.mlp.experts.34.down_proj", "model.layers.16.mlp.experts.35.down_proj", "model.layers.16.mlp.experts.36.down_proj", "model.layers.16.mlp.experts.37.down_proj", "model.layers.16.mlp.experts.38.down_proj", "model.layers.16.mlp.experts.39.down_proj", "model.layers.16.mlp.experts.40.down_proj", "model.layers.16.mlp.experts.41.down_proj", "model.layers.16.mlp.experts.42.down_proj", "model.layers.16.mlp.experts.43.down_proj", "model.layers.16.mlp.experts.44.down_proj", "model.layers.16.mlp.experts.45.down_proj", "model.layers.16.mlp.experts.46.down_proj", "model.layers.16.mlp.experts.47.down_proj", "model.layers.16.mlp.experts.48.down_proj", "model.layers.16.mlp.experts.49.down_proj", "model.layers.16.mlp.experts.50.down_proj", "model.layers.16.mlp.experts.51.down_proj", "model.layers.16.mlp.experts.52.down_proj", "model.layers.16.mlp.experts.53.down_proj", "model.layers.16.mlp.experts.54.down_proj", "model.layers.16.mlp.experts.55.down_proj", "model.layers.16.mlp.experts.56.down_proj", "model.layers.16.mlp.experts.57.down_proj", "model.layers.16.mlp.experts.58.down_proj", "model.layers.16.mlp.experts.59.down_proj", "model.layers.16.mlp.experts.60.down_proj", "model.layers.16.mlp.experts.61.down_proj", "model.layers.16.mlp.experts.62.down_proj", "model.layers.16.mlp.experts.63.down_proj", "model.layers.16.mlp.experts.64.down_proj", "model.layers.16.mlp.experts.65.down_proj", "model.layers.16.mlp.experts.66.down_proj", "model.layers.16.mlp.experts.67.down_proj", "model.layers.16.mlp.experts.68.down_proj", "model.layers.16.mlp.experts.69.down_proj", "model.layers.16.mlp.experts.70.down_proj", "model.layers.16.mlp.experts.71.down_proj", "model.layers.16.mlp.experts.72.down_proj", "model.layers.16.mlp.experts.73.down_proj", "model.layers.16.mlp.experts.74.down_proj", "model.layers.16.mlp.experts.75.down_proj", "model.layers.16.mlp.experts.76.down_proj", "model.layers.16.mlp.experts.77.down_proj", "model.layers.16.mlp.experts.78.down_proj", "model.layers.16.mlp.experts.79.down_proj", "model.layers.16.mlp.experts.80.down_proj", "model.layers.16.mlp.experts.81.down_proj", "model.layers.16.mlp.experts.82.down_proj", "model.layers.16.mlp.experts.83.down_proj", "model.layers.16.mlp.experts.84.down_proj", "model.layers.16.mlp.experts.85.down_proj", "model.layers.16.mlp.experts.86.down_proj", "model.layers.16.mlp.experts.87.down_proj", "model.layers.16.mlp.experts.88.down_proj", "model.layers.16.mlp.experts.89.down_proj", "model.layers.16.mlp.experts.90.down_proj", "model.layers.16.mlp.experts.91.down_proj", "model.layers.16.mlp.experts.92.down_proj", "model.layers.16.mlp.experts.93.down_proj", "model.layers.16.mlp.experts.94.down_proj", "model.layers.16.mlp.experts.95.down_proj", "model.layers.16.mlp.experts.96.down_proj", "model.layers.16.mlp.experts.97.down_proj", "model.layers.16.mlp.experts.98.down_proj", "model.layers.16.mlp.experts.99.down_proj", "model.layers.16.mlp.experts.100.down_proj", "model.layers.16.mlp.experts.101.down_proj", "model.layers.16.mlp.experts.102.down_proj", "model.layers.16.mlp.experts.103.down_proj", "model.layers.16.mlp.experts.104.down_proj", "model.layers.16.mlp.experts.105.down_proj", "model.layers.16.mlp.experts.106.down_proj", "model.layers.16.mlp.experts.107.down_proj", "model.layers.16.mlp.experts.108.down_proj", "model.layers.16.mlp.experts.109.down_proj", "model.layers.16.mlp.experts.110.down_proj", "model.layers.16.mlp.experts.111.down_proj", "model.layers.16.mlp.experts.112.down_proj", "model.layers.16.mlp.experts.113.down_proj", "model.layers.16.mlp.experts.114.down_proj", "model.layers.16.mlp.experts.115.down_proj", "model.layers.16.mlp.experts.116.down_proj", "model.layers.16.mlp.experts.117.down_proj", "model.layers.16.mlp.experts.118.down_proj", "model.layers.16.mlp.experts.119.down_proj", "model.layers.16.mlp.experts.120.down_proj", "model.layers.16.mlp.experts.121.down_proj", "model.layers.16.mlp.experts.122.down_proj", "model.layers.16.mlp.experts.123.down_proj", "model.layers.16.mlp.experts.124.down_proj", "model.layers.16.mlp.experts.125.down_proj", "model.layers.16.mlp.experts.126.down_proj", "model.layers.16.mlp.experts.127.down_proj", "model.layers.16.mlp.experts.128.down_proj", "model.layers.16.mlp.experts.129.down_proj", "model.layers.16.mlp.experts.130.down_proj", "model.layers.16.mlp.experts.131.down_proj", "model.layers.16.mlp.experts.132.down_proj", "model.layers.16.mlp.experts.133.down_proj", "model.layers.16.mlp.experts.134.down_proj", "model.layers.16.mlp.experts.135.down_proj", "model.layers.16.mlp.experts.136.down_proj", "model.layers.16.mlp.experts.137.down_proj", "model.layers.16.mlp.experts.138.down_proj", "model.layers.16.mlp.experts.139.down_proj", "model.layers.16.mlp.experts.140.down_proj", "model.layers.16.mlp.experts.141.down_proj", "model.layers.16.mlp.experts.142.down_proj", "model.layers.16.mlp.experts.143.down_proj", "model.layers.16.mlp.experts.144.down_proj", "model.layers.16.mlp.experts.145.down_proj", "model.layers.16.mlp.experts.146.down_proj", "model.layers.16.mlp.experts.147.down_proj", "model.layers.16.mlp.experts.148.down_proj", "model.layers.16.mlp.experts.149.down_proj", "model.layers.16.mlp.experts.150.down_proj", "model.layers.16.mlp.experts.151.down_proj", "model.layers.16.mlp.experts.152.down_proj", "model.layers.16.mlp.experts.153.down_proj", "model.layers.16.mlp.experts.154.down_proj", "model.layers.16.mlp.experts.155.down_proj", "model.layers.16.mlp.experts.156.down_proj", "model.layers.16.mlp.experts.157.down_proj", "model.layers.16.mlp.experts.158.down_proj", "model.layers.16.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -0.00015621578786522046, "dbits": 1258291200 }, { "dkld": -0.00010700577404349973, "dbits": 2516582400 } ] }, { "idx": 99, "layers": [ "model.layers.17.self_attn.q_proj" ], "candidates": [ { "dkld": -4.964151885360375e-05, "dbits": 62914560 }, { "dkld": -1.0487949475645672e-05, "dbits": 125829120 } ] }, { "idx": 100, "layers": [ "model.layers.17.self_attn.k_proj", "model.layers.17.self_attn.v_proj" ], "candidates": [ { "dkld": 5.7705212384469295e-06, "dbits": 10485760 }, { "dkld": 2.1400093100965717e-05, "dbits": 20971520 } ] }, { "idx": 101, "layers": [ "model.layers.17.self_attn.o_proj" ], "candidates": [ { "dkld": -1.9037141464650284e-05, "dbits": 62914560 }, { "dkld": -3.849074710160494e-05, "dbits": 125829120 } ] }, { "idx": 102, "layers": [ "model.layers.17.mlp.shared_experts.gate_proj", "model.layers.17.mlp.shared_experts.up_proj", "model.layers.17.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -6.011275108903577e-05, "dbits": 23592960 }, { "dkld": -9.572696872055426e-05, "dbits": 47185920 } ] }, { "idx": 103, "layers": [ "model.layers.17.mlp.experts.0.gate_proj", "model.layers.17.mlp.experts.1.gate_proj", "model.layers.17.mlp.experts.2.gate_proj", "model.layers.17.mlp.experts.3.gate_proj", "model.layers.17.mlp.experts.4.gate_proj", "model.layers.17.mlp.experts.5.gate_proj", "model.layers.17.mlp.experts.6.gate_proj", "model.layers.17.mlp.experts.7.gate_proj", "model.layers.17.mlp.experts.8.gate_proj", "model.layers.17.mlp.experts.9.gate_proj", "model.layers.17.mlp.experts.10.gate_proj", "model.layers.17.mlp.experts.11.gate_proj", "model.layers.17.mlp.experts.12.gate_proj", "model.layers.17.mlp.experts.13.gate_proj", "model.layers.17.mlp.experts.14.gate_proj", "model.layers.17.mlp.experts.15.gate_proj", "model.layers.17.mlp.experts.16.gate_proj", "model.layers.17.mlp.experts.17.gate_proj", "model.layers.17.mlp.experts.18.gate_proj", "model.layers.17.mlp.experts.19.gate_proj", "model.layers.17.mlp.experts.20.gate_proj", "model.layers.17.mlp.experts.21.gate_proj", "model.layers.17.mlp.experts.22.gate_proj", "model.layers.17.mlp.experts.23.gate_proj", "model.layers.17.mlp.experts.24.gate_proj", "model.layers.17.mlp.experts.25.gate_proj", "model.layers.17.mlp.experts.26.gate_proj", "model.layers.17.mlp.experts.27.gate_proj", "model.layers.17.mlp.experts.28.gate_proj", "model.layers.17.mlp.experts.29.gate_proj", "model.layers.17.mlp.experts.30.gate_proj", "model.layers.17.mlp.experts.31.gate_proj", "model.layers.17.mlp.experts.32.gate_proj", "model.layers.17.mlp.experts.33.gate_proj", "model.layers.17.mlp.experts.34.gate_proj", "model.layers.17.mlp.experts.35.gate_proj", "model.layers.17.mlp.experts.36.gate_proj", "model.layers.17.mlp.experts.37.gate_proj", "model.layers.17.mlp.experts.38.gate_proj", "model.layers.17.mlp.experts.39.gate_proj", "model.layers.17.mlp.experts.40.gate_proj", "model.layers.17.mlp.experts.41.gate_proj", "model.layers.17.mlp.experts.42.gate_proj", "model.layers.17.mlp.experts.43.gate_proj", "model.layers.17.mlp.experts.44.gate_proj", "model.layers.17.mlp.experts.45.gate_proj", "model.layers.17.mlp.experts.46.gate_proj", "model.layers.17.mlp.experts.47.gate_proj", "model.layers.17.mlp.experts.48.gate_proj", "model.layers.17.mlp.experts.49.gate_proj", "model.layers.17.mlp.experts.50.gate_proj", "model.layers.17.mlp.experts.51.gate_proj", "model.layers.17.mlp.experts.52.gate_proj", "model.layers.17.mlp.experts.53.gate_proj", "model.layers.17.mlp.experts.54.gate_proj", "model.layers.17.mlp.experts.55.gate_proj", "model.layers.17.mlp.experts.56.gate_proj", "model.layers.17.mlp.experts.57.gate_proj", "model.layers.17.mlp.experts.58.gate_proj", "model.layers.17.mlp.experts.59.gate_proj", "model.layers.17.mlp.experts.60.gate_proj", "model.layers.17.mlp.experts.61.gate_proj", "model.layers.17.mlp.experts.62.gate_proj", "model.layers.17.mlp.experts.63.gate_proj", "model.layers.17.mlp.experts.64.gate_proj", "model.layers.17.mlp.experts.65.gate_proj", "model.layers.17.mlp.experts.66.gate_proj", "model.layers.17.mlp.experts.67.gate_proj", "model.layers.17.mlp.experts.68.gate_proj", "model.layers.17.mlp.experts.69.gate_proj", "model.layers.17.mlp.experts.70.gate_proj", "model.layers.17.mlp.experts.71.gate_proj", "model.layers.17.mlp.experts.72.gate_proj", "model.layers.17.mlp.experts.73.gate_proj", "model.layers.17.mlp.experts.74.gate_proj", "model.layers.17.mlp.experts.75.gate_proj", "model.layers.17.mlp.experts.76.gate_proj", "model.layers.17.mlp.experts.77.gate_proj", "model.layers.17.mlp.experts.78.gate_proj", "model.layers.17.mlp.experts.79.gate_proj", "model.layers.17.mlp.experts.80.gate_proj", "model.layers.17.mlp.experts.81.gate_proj", "model.layers.17.mlp.experts.82.gate_proj", "model.layers.17.mlp.experts.83.gate_proj", "model.layers.17.mlp.experts.84.gate_proj", "model.layers.17.mlp.experts.85.gate_proj", "model.layers.17.mlp.experts.86.gate_proj", "model.layers.17.mlp.experts.87.gate_proj", "model.layers.17.mlp.experts.88.gate_proj", "model.layers.17.mlp.experts.89.gate_proj", "model.layers.17.mlp.experts.90.gate_proj", "model.layers.17.mlp.experts.91.gate_proj", "model.layers.17.mlp.experts.92.gate_proj", "model.layers.17.mlp.experts.93.gate_proj", "model.layers.17.mlp.experts.94.gate_proj", "model.layers.17.mlp.experts.95.gate_proj", "model.layers.17.mlp.experts.96.gate_proj", "model.layers.17.mlp.experts.97.gate_proj", "model.layers.17.mlp.experts.98.gate_proj", "model.layers.17.mlp.experts.99.gate_proj", "model.layers.17.mlp.experts.100.gate_proj", "model.layers.17.mlp.experts.101.gate_proj", "model.layers.17.mlp.experts.102.gate_proj", "model.layers.17.mlp.experts.103.gate_proj", "model.layers.17.mlp.experts.104.gate_proj", "model.layers.17.mlp.experts.105.gate_proj", "model.layers.17.mlp.experts.106.gate_proj", "model.layers.17.mlp.experts.107.gate_proj", "model.layers.17.mlp.experts.108.gate_proj", "model.layers.17.mlp.experts.109.gate_proj", "model.layers.17.mlp.experts.110.gate_proj", "model.layers.17.mlp.experts.111.gate_proj", "model.layers.17.mlp.experts.112.gate_proj", "model.layers.17.mlp.experts.113.gate_proj", "model.layers.17.mlp.experts.114.gate_proj", "model.layers.17.mlp.experts.115.gate_proj", "model.layers.17.mlp.experts.116.gate_proj", "model.layers.17.mlp.experts.117.gate_proj", "model.layers.17.mlp.experts.118.gate_proj", "model.layers.17.mlp.experts.119.gate_proj", "model.layers.17.mlp.experts.120.gate_proj", "model.layers.17.mlp.experts.121.gate_proj", "model.layers.17.mlp.experts.122.gate_proj", "model.layers.17.mlp.experts.123.gate_proj", "model.layers.17.mlp.experts.124.gate_proj", "model.layers.17.mlp.experts.125.gate_proj", "model.layers.17.mlp.experts.126.gate_proj", "model.layers.17.mlp.experts.127.gate_proj", "model.layers.17.mlp.experts.128.gate_proj", "model.layers.17.mlp.experts.129.gate_proj", "model.layers.17.mlp.experts.130.gate_proj", "model.layers.17.mlp.experts.131.gate_proj", "model.layers.17.mlp.experts.132.gate_proj", "model.layers.17.mlp.experts.133.gate_proj", "model.layers.17.mlp.experts.134.gate_proj", "model.layers.17.mlp.experts.135.gate_proj", "model.layers.17.mlp.experts.136.gate_proj", "model.layers.17.mlp.experts.137.gate_proj", "model.layers.17.mlp.experts.138.gate_proj", "model.layers.17.mlp.experts.139.gate_proj", "model.layers.17.mlp.experts.140.gate_proj", "model.layers.17.mlp.experts.141.gate_proj", "model.layers.17.mlp.experts.142.gate_proj", "model.layers.17.mlp.experts.143.gate_proj", "model.layers.17.mlp.experts.144.gate_proj", "model.layers.17.mlp.experts.145.gate_proj", "model.layers.17.mlp.experts.146.gate_proj", "model.layers.17.mlp.experts.147.gate_proj", "model.layers.17.mlp.experts.148.gate_proj", "model.layers.17.mlp.experts.149.gate_proj", "model.layers.17.mlp.experts.150.gate_proj", "model.layers.17.mlp.experts.151.gate_proj", "model.layers.17.mlp.experts.152.gate_proj", "model.layers.17.mlp.experts.153.gate_proj", "model.layers.17.mlp.experts.154.gate_proj", "model.layers.17.mlp.experts.155.gate_proj", "model.layers.17.mlp.experts.156.gate_proj", "model.layers.17.mlp.experts.157.gate_proj", "model.layers.17.mlp.experts.158.gate_proj", "model.layers.17.mlp.experts.159.gate_proj", "model.layers.17.mlp.experts.0.up_proj", "model.layers.17.mlp.experts.1.up_proj", "model.layers.17.mlp.experts.2.up_proj", "model.layers.17.mlp.experts.3.up_proj", "model.layers.17.mlp.experts.4.up_proj", "model.layers.17.mlp.experts.5.up_proj", "model.layers.17.mlp.experts.6.up_proj", "model.layers.17.mlp.experts.7.up_proj", "model.layers.17.mlp.experts.8.up_proj", "model.layers.17.mlp.experts.9.up_proj", "model.layers.17.mlp.experts.10.up_proj", "model.layers.17.mlp.experts.11.up_proj", "model.layers.17.mlp.experts.12.up_proj", "model.layers.17.mlp.experts.13.up_proj", "model.layers.17.mlp.experts.14.up_proj", "model.layers.17.mlp.experts.15.up_proj", "model.layers.17.mlp.experts.16.up_proj", "model.layers.17.mlp.experts.17.up_proj", "model.layers.17.mlp.experts.18.up_proj", "model.layers.17.mlp.experts.19.up_proj", "model.layers.17.mlp.experts.20.up_proj", "model.layers.17.mlp.experts.21.up_proj", "model.layers.17.mlp.experts.22.up_proj", "model.layers.17.mlp.experts.23.up_proj", "model.layers.17.mlp.experts.24.up_proj", "model.layers.17.mlp.experts.25.up_proj", "model.layers.17.mlp.experts.26.up_proj", "model.layers.17.mlp.experts.27.up_proj", "model.layers.17.mlp.experts.28.up_proj", "model.layers.17.mlp.experts.29.up_proj", "model.layers.17.mlp.experts.30.up_proj", "model.layers.17.mlp.experts.31.up_proj", "model.layers.17.mlp.experts.32.up_proj", "model.layers.17.mlp.experts.33.up_proj", "model.layers.17.mlp.experts.34.up_proj", "model.layers.17.mlp.experts.35.up_proj", "model.layers.17.mlp.experts.36.up_proj", "model.layers.17.mlp.experts.37.up_proj", "model.layers.17.mlp.experts.38.up_proj", "model.layers.17.mlp.experts.39.up_proj", "model.layers.17.mlp.experts.40.up_proj", "model.layers.17.mlp.experts.41.up_proj", "model.layers.17.mlp.experts.42.up_proj", "model.layers.17.mlp.experts.43.up_proj", "model.layers.17.mlp.experts.44.up_proj", "model.layers.17.mlp.experts.45.up_proj", "model.layers.17.mlp.experts.46.up_proj", "model.layers.17.mlp.experts.47.up_proj", "model.layers.17.mlp.experts.48.up_proj", "model.layers.17.mlp.experts.49.up_proj", "model.layers.17.mlp.experts.50.up_proj", "model.layers.17.mlp.experts.51.up_proj", "model.layers.17.mlp.experts.52.up_proj", "model.layers.17.mlp.experts.53.up_proj", "model.layers.17.mlp.experts.54.up_proj", "model.layers.17.mlp.experts.55.up_proj", "model.layers.17.mlp.experts.56.up_proj", "model.layers.17.mlp.experts.57.up_proj", "model.layers.17.mlp.experts.58.up_proj", "model.layers.17.mlp.experts.59.up_proj", "model.layers.17.mlp.experts.60.up_proj", "model.layers.17.mlp.experts.61.up_proj", "model.layers.17.mlp.experts.62.up_proj", "model.layers.17.mlp.experts.63.up_proj", "model.layers.17.mlp.experts.64.up_proj", "model.layers.17.mlp.experts.65.up_proj", "model.layers.17.mlp.experts.66.up_proj", "model.layers.17.mlp.experts.67.up_proj", "model.layers.17.mlp.experts.68.up_proj", "model.layers.17.mlp.experts.69.up_proj", "model.layers.17.mlp.experts.70.up_proj", "model.layers.17.mlp.experts.71.up_proj", "model.layers.17.mlp.experts.72.up_proj", "model.layers.17.mlp.experts.73.up_proj", "model.layers.17.mlp.experts.74.up_proj", "model.layers.17.mlp.experts.75.up_proj", "model.layers.17.mlp.experts.76.up_proj", "model.layers.17.mlp.experts.77.up_proj", "model.layers.17.mlp.experts.78.up_proj", "model.layers.17.mlp.experts.79.up_proj", "model.layers.17.mlp.experts.80.up_proj", "model.layers.17.mlp.experts.81.up_proj", "model.layers.17.mlp.experts.82.up_proj", "model.layers.17.mlp.experts.83.up_proj", "model.layers.17.mlp.experts.84.up_proj", "model.layers.17.mlp.experts.85.up_proj", "model.layers.17.mlp.experts.86.up_proj", "model.layers.17.mlp.experts.87.up_proj", "model.layers.17.mlp.experts.88.up_proj", "model.layers.17.mlp.experts.89.up_proj", "model.layers.17.mlp.experts.90.up_proj", "model.layers.17.mlp.experts.91.up_proj", "model.layers.17.mlp.experts.92.up_proj", "model.layers.17.mlp.experts.93.up_proj", "model.layers.17.mlp.experts.94.up_proj", "model.layers.17.mlp.experts.95.up_proj", "model.layers.17.mlp.experts.96.up_proj", "model.layers.17.mlp.experts.97.up_proj", "model.layers.17.mlp.experts.98.up_proj", "model.layers.17.mlp.experts.99.up_proj", "model.layers.17.mlp.experts.100.up_proj", "model.layers.17.mlp.experts.101.up_proj", "model.layers.17.mlp.experts.102.up_proj", "model.layers.17.mlp.experts.103.up_proj", "model.layers.17.mlp.experts.104.up_proj", "model.layers.17.mlp.experts.105.up_proj", "model.layers.17.mlp.experts.106.up_proj", "model.layers.17.mlp.experts.107.up_proj", "model.layers.17.mlp.experts.108.up_proj", "model.layers.17.mlp.experts.109.up_proj", "model.layers.17.mlp.experts.110.up_proj", "model.layers.17.mlp.experts.111.up_proj", "model.layers.17.mlp.experts.112.up_proj", "model.layers.17.mlp.experts.113.up_proj", "model.layers.17.mlp.experts.114.up_proj", "model.layers.17.mlp.experts.115.up_proj", "model.layers.17.mlp.experts.116.up_proj", "model.layers.17.mlp.experts.117.up_proj", "model.layers.17.mlp.experts.118.up_proj", "model.layers.17.mlp.experts.119.up_proj", "model.layers.17.mlp.experts.120.up_proj", "model.layers.17.mlp.experts.121.up_proj", "model.layers.17.mlp.experts.122.up_proj", "model.layers.17.mlp.experts.123.up_proj", "model.layers.17.mlp.experts.124.up_proj", "model.layers.17.mlp.experts.125.up_proj", "model.layers.17.mlp.experts.126.up_proj", "model.layers.17.mlp.experts.127.up_proj", "model.layers.17.mlp.experts.128.up_proj", "model.layers.17.mlp.experts.129.up_proj", "model.layers.17.mlp.experts.130.up_proj", "model.layers.17.mlp.experts.131.up_proj", "model.layers.17.mlp.experts.132.up_proj", "model.layers.17.mlp.experts.133.up_proj", "model.layers.17.mlp.experts.134.up_proj", "model.layers.17.mlp.experts.135.up_proj", "model.layers.17.mlp.experts.136.up_proj", "model.layers.17.mlp.experts.137.up_proj", "model.layers.17.mlp.experts.138.up_proj", "model.layers.17.mlp.experts.139.up_proj", "model.layers.17.mlp.experts.140.up_proj", "model.layers.17.mlp.experts.141.up_proj", "model.layers.17.mlp.experts.142.up_proj", "model.layers.17.mlp.experts.143.up_proj", "model.layers.17.mlp.experts.144.up_proj", "model.layers.17.mlp.experts.145.up_proj", "model.layers.17.mlp.experts.146.up_proj", "model.layers.17.mlp.experts.147.up_proj", "model.layers.17.mlp.experts.148.up_proj", "model.layers.17.mlp.experts.149.up_proj", "model.layers.17.mlp.experts.150.up_proj", "model.layers.17.mlp.experts.151.up_proj", "model.layers.17.mlp.experts.152.up_proj", "model.layers.17.mlp.experts.153.up_proj", "model.layers.17.mlp.experts.154.up_proj", "model.layers.17.mlp.experts.155.up_proj", "model.layers.17.mlp.experts.156.up_proj", "model.layers.17.mlp.experts.157.up_proj", "model.layers.17.mlp.experts.158.up_proj", "model.layers.17.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -8.643660694360698e-05, "dbits": 2516582400 }, { "dkld": -0.00010066998656839063, "dbits": 5033164800 } ] }, { "idx": 104, "layers": [ "model.layers.17.mlp.experts.0.down_proj", "model.layers.17.mlp.experts.1.down_proj", "model.layers.17.mlp.experts.2.down_proj", "model.layers.17.mlp.experts.3.down_proj", "model.layers.17.mlp.experts.4.down_proj", "model.layers.17.mlp.experts.5.down_proj", "model.layers.17.mlp.experts.6.down_proj", "model.layers.17.mlp.experts.7.down_proj", "model.layers.17.mlp.experts.8.down_proj", "model.layers.17.mlp.experts.9.down_proj", "model.layers.17.mlp.experts.10.down_proj", "model.layers.17.mlp.experts.11.down_proj", "model.layers.17.mlp.experts.12.down_proj", "model.layers.17.mlp.experts.13.down_proj", "model.layers.17.mlp.experts.14.down_proj", "model.layers.17.mlp.experts.15.down_proj", "model.layers.17.mlp.experts.16.down_proj", "model.layers.17.mlp.experts.17.down_proj", "model.layers.17.mlp.experts.18.down_proj", "model.layers.17.mlp.experts.19.down_proj", "model.layers.17.mlp.experts.20.down_proj", "model.layers.17.mlp.experts.21.down_proj", "model.layers.17.mlp.experts.22.down_proj", "model.layers.17.mlp.experts.23.down_proj", "model.layers.17.mlp.experts.24.down_proj", "model.layers.17.mlp.experts.25.down_proj", "model.layers.17.mlp.experts.26.down_proj", "model.layers.17.mlp.experts.27.down_proj", "model.layers.17.mlp.experts.28.down_proj", "model.layers.17.mlp.experts.29.down_proj", "model.layers.17.mlp.experts.30.down_proj", "model.layers.17.mlp.experts.31.down_proj", "model.layers.17.mlp.experts.32.down_proj", "model.layers.17.mlp.experts.33.down_proj", "model.layers.17.mlp.experts.34.down_proj", "model.layers.17.mlp.experts.35.down_proj", "model.layers.17.mlp.experts.36.down_proj", "model.layers.17.mlp.experts.37.down_proj", "model.layers.17.mlp.experts.38.down_proj", "model.layers.17.mlp.experts.39.down_proj", "model.layers.17.mlp.experts.40.down_proj", "model.layers.17.mlp.experts.41.down_proj", "model.layers.17.mlp.experts.42.down_proj", "model.layers.17.mlp.experts.43.down_proj", "model.layers.17.mlp.experts.44.down_proj", "model.layers.17.mlp.experts.45.down_proj", "model.layers.17.mlp.experts.46.down_proj", "model.layers.17.mlp.experts.47.down_proj", "model.layers.17.mlp.experts.48.down_proj", "model.layers.17.mlp.experts.49.down_proj", "model.layers.17.mlp.experts.50.down_proj", "model.layers.17.mlp.experts.51.down_proj", "model.layers.17.mlp.experts.52.down_proj", "model.layers.17.mlp.experts.53.down_proj", "model.layers.17.mlp.experts.54.down_proj", "model.layers.17.mlp.experts.55.down_proj", "model.layers.17.mlp.experts.56.down_proj", "model.layers.17.mlp.experts.57.down_proj", "model.layers.17.mlp.experts.58.down_proj", "model.layers.17.mlp.experts.59.down_proj", "model.layers.17.mlp.experts.60.down_proj", "model.layers.17.mlp.experts.61.down_proj", "model.layers.17.mlp.experts.62.down_proj", "model.layers.17.mlp.experts.63.down_proj", "model.layers.17.mlp.experts.64.down_proj", "model.layers.17.mlp.experts.65.down_proj", "model.layers.17.mlp.experts.66.down_proj", "model.layers.17.mlp.experts.67.down_proj", "model.layers.17.mlp.experts.68.down_proj", "model.layers.17.mlp.experts.69.down_proj", "model.layers.17.mlp.experts.70.down_proj", "model.layers.17.mlp.experts.71.down_proj", "model.layers.17.mlp.experts.72.down_proj", "model.layers.17.mlp.experts.73.down_proj", "model.layers.17.mlp.experts.74.down_proj", "model.layers.17.mlp.experts.75.down_proj", "model.layers.17.mlp.experts.76.down_proj", "model.layers.17.mlp.experts.77.down_proj", "model.layers.17.mlp.experts.78.down_proj", "model.layers.17.mlp.experts.79.down_proj", "model.layers.17.mlp.experts.80.down_proj", "model.layers.17.mlp.experts.81.down_proj", "model.layers.17.mlp.experts.82.down_proj", "model.layers.17.mlp.experts.83.down_proj", "model.layers.17.mlp.experts.84.down_proj", "model.layers.17.mlp.experts.85.down_proj", "model.layers.17.mlp.experts.86.down_proj", "model.layers.17.mlp.experts.87.down_proj", "model.layers.17.mlp.experts.88.down_proj", "model.layers.17.mlp.experts.89.down_proj", "model.layers.17.mlp.experts.90.down_proj", "model.layers.17.mlp.experts.91.down_proj", "model.layers.17.mlp.experts.92.down_proj", "model.layers.17.mlp.experts.93.down_proj", "model.layers.17.mlp.experts.94.down_proj", "model.layers.17.mlp.experts.95.down_proj", "model.layers.17.mlp.experts.96.down_proj", "model.layers.17.mlp.experts.97.down_proj", "model.layers.17.mlp.experts.98.down_proj", "model.layers.17.mlp.experts.99.down_proj", "model.layers.17.mlp.experts.100.down_proj", "model.layers.17.mlp.experts.101.down_proj", "model.layers.17.mlp.experts.102.down_proj", "model.layers.17.mlp.experts.103.down_proj", "model.layers.17.mlp.experts.104.down_proj", "model.layers.17.mlp.experts.105.down_proj", "model.layers.17.mlp.experts.106.down_proj", "model.layers.17.mlp.experts.107.down_proj", "model.layers.17.mlp.experts.108.down_proj", "model.layers.17.mlp.experts.109.down_proj", "model.layers.17.mlp.experts.110.down_proj", "model.layers.17.mlp.experts.111.down_proj", "model.layers.17.mlp.experts.112.down_proj", "model.layers.17.mlp.experts.113.down_proj", "model.layers.17.mlp.experts.114.down_proj", "model.layers.17.mlp.experts.115.down_proj", "model.layers.17.mlp.experts.116.down_proj", "model.layers.17.mlp.experts.117.down_proj", "model.layers.17.mlp.experts.118.down_proj", "model.layers.17.mlp.experts.119.down_proj", "model.layers.17.mlp.experts.120.down_proj", "model.layers.17.mlp.experts.121.down_proj", "model.layers.17.mlp.experts.122.down_proj", "model.layers.17.mlp.experts.123.down_proj", "model.layers.17.mlp.experts.124.down_proj", "model.layers.17.mlp.experts.125.down_proj", "model.layers.17.mlp.experts.126.down_proj", "model.layers.17.mlp.experts.127.down_proj", "model.layers.17.mlp.experts.128.down_proj", "model.layers.17.mlp.experts.129.down_proj", "model.layers.17.mlp.experts.130.down_proj", "model.layers.17.mlp.experts.131.down_proj", "model.layers.17.mlp.experts.132.down_proj", "model.layers.17.mlp.experts.133.down_proj", "model.layers.17.mlp.experts.134.down_proj", "model.layers.17.mlp.experts.135.down_proj", "model.layers.17.mlp.experts.136.down_proj", "model.layers.17.mlp.experts.137.down_proj", "model.layers.17.mlp.experts.138.down_proj", "model.layers.17.mlp.experts.139.down_proj", "model.layers.17.mlp.experts.140.down_proj", "model.layers.17.mlp.experts.141.down_proj", "model.layers.17.mlp.experts.142.down_proj", "model.layers.17.mlp.experts.143.down_proj", "model.layers.17.mlp.experts.144.down_proj", "model.layers.17.mlp.experts.145.down_proj", "model.layers.17.mlp.experts.146.down_proj", "model.layers.17.mlp.experts.147.down_proj", "model.layers.17.mlp.experts.148.down_proj", "model.layers.17.mlp.experts.149.down_proj", "model.layers.17.mlp.experts.150.down_proj", "model.layers.17.mlp.experts.151.down_proj", "model.layers.17.mlp.experts.152.down_proj", "model.layers.17.mlp.experts.153.down_proj", "model.layers.17.mlp.experts.154.down_proj", "model.layers.17.mlp.experts.155.down_proj", "model.layers.17.mlp.experts.156.down_proj", "model.layers.17.mlp.experts.157.down_proj", "model.layers.17.mlp.experts.158.down_proj", "model.layers.17.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -6.390607450157404e-05, "dbits": 1258291200 }, { "dkld": -4.047134425490956e-05, "dbits": 2516582400 } ] }, { "idx": 105, "layers": [ "model.layers.18.self_attn.q_proj" ], "candidates": [ { "dkld": 0.00010677329264581308, "dbits": 62914560 }, { "dkld": 2.572159282863279e-05, "dbits": 125829120 } ] }, { "idx": 106, "layers": [ "model.layers.18.self_attn.k_proj", "model.layers.18.self_attn.v_proj" ], "candidates": [ { "dkld": 4.050047136843274e-05, "dbits": 10485760 }, { "dkld": 3.5482947714627136e-05, "dbits": 20971520 } ] }, { "idx": 107, "layers": [ "model.layers.18.self_attn.o_proj" ], "candidates": [ { "dkld": 2.6661693118512977e-05, "dbits": 62914560 }, { "dkld": -6.81598205119361e-05, "dbits": 125829120 } ] }, { "idx": 108, "layers": [ "model.layers.18.mlp.shared_experts.gate_proj", "model.layers.18.mlp.shared_experts.up_proj", "model.layers.18.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00024247246328741243, "dbits": 23592960 }, { "dkld": -0.0002325587207451449, "dbits": 47185920 } ] }, { "idx": 109, "layers": [ "model.layers.18.mlp.experts.0.gate_proj", "model.layers.18.mlp.experts.1.gate_proj", "model.layers.18.mlp.experts.2.gate_proj", "model.layers.18.mlp.experts.3.gate_proj", "model.layers.18.mlp.experts.4.gate_proj", "model.layers.18.mlp.experts.5.gate_proj", "model.layers.18.mlp.experts.6.gate_proj", "model.layers.18.mlp.experts.7.gate_proj", "model.layers.18.mlp.experts.8.gate_proj", "model.layers.18.mlp.experts.9.gate_proj", "model.layers.18.mlp.experts.10.gate_proj", "model.layers.18.mlp.experts.11.gate_proj", "model.layers.18.mlp.experts.12.gate_proj", "model.layers.18.mlp.experts.13.gate_proj", "model.layers.18.mlp.experts.14.gate_proj", "model.layers.18.mlp.experts.15.gate_proj", "model.layers.18.mlp.experts.16.gate_proj", "model.layers.18.mlp.experts.17.gate_proj", "model.layers.18.mlp.experts.18.gate_proj", "model.layers.18.mlp.experts.19.gate_proj", "model.layers.18.mlp.experts.20.gate_proj", "model.layers.18.mlp.experts.21.gate_proj", "model.layers.18.mlp.experts.22.gate_proj", "model.layers.18.mlp.experts.23.gate_proj", "model.layers.18.mlp.experts.24.gate_proj", "model.layers.18.mlp.experts.25.gate_proj", "model.layers.18.mlp.experts.26.gate_proj", "model.layers.18.mlp.experts.27.gate_proj", "model.layers.18.mlp.experts.28.gate_proj", "model.layers.18.mlp.experts.29.gate_proj", "model.layers.18.mlp.experts.30.gate_proj", "model.layers.18.mlp.experts.31.gate_proj", "model.layers.18.mlp.experts.32.gate_proj", "model.layers.18.mlp.experts.33.gate_proj", "model.layers.18.mlp.experts.34.gate_proj", "model.layers.18.mlp.experts.35.gate_proj", "model.layers.18.mlp.experts.36.gate_proj", "model.layers.18.mlp.experts.37.gate_proj", "model.layers.18.mlp.experts.38.gate_proj", "model.layers.18.mlp.experts.39.gate_proj", "model.layers.18.mlp.experts.40.gate_proj", "model.layers.18.mlp.experts.41.gate_proj", "model.layers.18.mlp.experts.42.gate_proj", "model.layers.18.mlp.experts.43.gate_proj", "model.layers.18.mlp.experts.44.gate_proj", "model.layers.18.mlp.experts.45.gate_proj", "model.layers.18.mlp.experts.46.gate_proj", "model.layers.18.mlp.experts.47.gate_proj", "model.layers.18.mlp.experts.48.gate_proj", "model.layers.18.mlp.experts.49.gate_proj", "model.layers.18.mlp.experts.50.gate_proj", "model.layers.18.mlp.experts.51.gate_proj", "model.layers.18.mlp.experts.52.gate_proj", "model.layers.18.mlp.experts.53.gate_proj", "model.layers.18.mlp.experts.54.gate_proj", "model.layers.18.mlp.experts.55.gate_proj", "model.layers.18.mlp.experts.56.gate_proj", "model.layers.18.mlp.experts.57.gate_proj", "model.layers.18.mlp.experts.58.gate_proj", "model.layers.18.mlp.experts.59.gate_proj", "model.layers.18.mlp.experts.60.gate_proj", "model.layers.18.mlp.experts.61.gate_proj", "model.layers.18.mlp.experts.62.gate_proj", "model.layers.18.mlp.experts.63.gate_proj", "model.layers.18.mlp.experts.64.gate_proj", "model.layers.18.mlp.experts.65.gate_proj", "model.layers.18.mlp.experts.66.gate_proj", "model.layers.18.mlp.experts.67.gate_proj", "model.layers.18.mlp.experts.68.gate_proj", "model.layers.18.mlp.experts.69.gate_proj", "model.layers.18.mlp.experts.70.gate_proj", "model.layers.18.mlp.experts.71.gate_proj", "model.layers.18.mlp.experts.72.gate_proj", "model.layers.18.mlp.experts.73.gate_proj", "model.layers.18.mlp.experts.74.gate_proj", "model.layers.18.mlp.experts.75.gate_proj", "model.layers.18.mlp.experts.76.gate_proj", "model.layers.18.mlp.experts.77.gate_proj", "model.layers.18.mlp.experts.78.gate_proj", "model.layers.18.mlp.experts.79.gate_proj", "model.layers.18.mlp.experts.80.gate_proj", "model.layers.18.mlp.experts.81.gate_proj", "model.layers.18.mlp.experts.82.gate_proj", "model.layers.18.mlp.experts.83.gate_proj", "model.layers.18.mlp.experts.84.gate_proj", "model.layers.18.mlp.experts.85.gate_proj", "model.layers.18.mlp.experts.86.gate_proj", "model.layers.18.mlp.experts.87.gate_proj", "model.layers.18.mlp.experts.88.gate_proj", "model.layers.18.mlp.experts.89.gate_proj", "model.layers.18.mlp.experts.90.gate_proj", "model.layers.18.mlp.experts.91.gate_proj", "model.layers.18.mlp.experts.92.gate_proj", "model.layers.18.mlp.experts.93.gate_proj", "model.layers.18.mlp.experts.94.gate_proj", "model.layers.18.mlp.experts.95.gate_proj", "model.layers.18.mlp.experts.96.gate_proj", "model.layers.18.mlp.experts.97.gate_proj", "model.layers.18.mlp.experts.98.gate_proj", "model.layers.18.mlp.experts.99.gate_proj", "model.layers.18.mlp.experts.100.gate_proj", "model.layers.18.mlp.experts.101.gate_proj", "model.layers.18.mlp.experts.102.gate_proj", "model.layers.18.mlp.experts.103.gate_proj", "model.layers.18.mlp.experts.104.gate_proj", "model.layers.18.mlp.experts.105.gate_proj", "model.layers.18.mlp.experts.106.gate_proj", "model.layers.18.mlp.experts.107.gate_proj", "model.layers.18.mlp.experts.108.gate_proj", "model.layers.18.mlp.experts.109.gate_proj", "model.layers.18.mlp.experts.110.gate_proj", "model.layers.18.mlp.experts.111.gate_proj", "model.layers.18.mlp.experts.112.gate_proj", "model.layers.18.mlp.experts.113.gate_proj", "model.layers.18.mlp.experts.114.gate_proj", "model.layers.18.mlp.experts.115.gate_proj", "model.layers.18.mlp.experts.116.gate_proj", "model.layers.18.mlp.experts.117.gate_proj", "model.layers.18.mlp.experts.118.gate_proj", "model.layers.18.mlp.experts.119.gate_proj", "model.layers.18.mlp.experts.120.gate_proj", "model.layers.18.mlp.experts.121.gate_proj", "model.layers.18.mlp.experts.122.gate_proj", "model.layers.18.mlp.experts.123.gate_proj", "model.layers.18.mlp.experts.124.gate_proj", "model.layers.18.mlp.experts.125.gate_proj", "model.layers.18.mlp.experts.126.gate_proj", "model.layers.18.mlp.experts.127.gate_proj", "model.layers.18.mlp.experts.128.gate_proj", "model.layers.18.mlp.experts.129.gate_proj", "model.layers.18.mlp.experts.130.gate_proj", "model.layers.18.mlp.experts.131.gate_proj", "model.layers.18.mlp.experts.132.gate_proj", "model.layers.18.mlp.experts.133.gate_proj", "model.layers.18.mlp.experts.134.gate_proj", "model.layers.18.mlp.experts.135.gate_proj", "model.layers.18.mlp.experts.136.gate_proj", "model.layers.18.mlp.experts.137.gate_proj", "model.layers.18.mlp.experts.138.gate_proj", "model.layers.18.mlp.experts.139.gate_proj", "model.layers.18.mlp.experts.140.gate_proj", "model.layers.18.mlp.experts.141.gate_proj", "model.layers.18.mlp.experts.142.gate_proj", "model.layers.18.mlp.experts.143.gate_proj", "model.layers.18.mlp.experts.144.gate_proj", "model.layers.18.mlp.experts.145.gate_proj", "model.layers.18.mlp.experts.146.gate_proj", "model.layers.18.mlp.experts.147.gate_proj", "model.layers.18.mlp.experts.148.gate_proj", "model.layers.18.mlp.experts.149.gate_proj", "model.layers.18.mlp.experts.150.gate_proj", "model.layers.18.mlp.experts.151.gate_proj", "model.layers.18.mlp.experts.152.gate_proj", "model.layers.18.mlp.experts.153.gate_proj", "model.layers.18.mlp.experts.154.gate_proj", "model.layers.18.mlp.experts.155.gate_proj", "model.layers.18.mlp.experts.156.gate_proj", "model.layers.18.mlp.experts.157.gate_proj", "model.layers.18.mlp.experts.158.gate_proj", "model.layers.18.mlp.experts.159.gate_proj", "model.layers.18.mlp.experts.0.up_proj", "model.layers.18.mlp.experts.1.up_proj", "model.layers.18.mlp.experts.2.up_proj", "model.layers.18.mlp.experts.3.up_proj", "model.layers.18.mlp.experts.4.up_proj", "model.layers.18.mlp.experts.5.up_proj", "model.layers.18.mlp.experts.6.up_proj", "model.layers.18.mlp.experts.7.up_proj", "model.layers.18.mlp.experts.8.up_proj", "model.layers.18.mlp.experts.9.up_proj", "model.layers.18.mlp.experts.10.up_proj", "model.layers.18.mlp.experts.11.up_proj", "model.layers.18.mlp.experts.12.up_proj", "model.layers.18.mlp.experts.13.up_proj", "model.layers.18.mlp.experts.14.up_proj", "model.layers.18.mlp.experts.15.up_proj", "model.layers.18.mlp.experts.16.up_proj", "model.layers.18.mlp.experts.17.up_proj", "model.layers.18.mlp.experts.18.up_proj", "model.layers.18.mlp.experts.19.up_proj", "model.layers.18.mlp.experts.20.up_proj", "model.layers.18.mlp.experts.21.up_proj", "model.layers.18.mlp.experts.22.up_proj", "model.layers.18.mlp.experts.23.up_proj", "model.layers.18.mlp.experts.24.up_proj", "model.layers.18.mlp.experts.25.up_proj", "model.layers.18.mlp.experts.26.up_proj", "model.layers.18.mlp.experts.27.up_proj", "model.layers.18.mlp.experts.28.up_proj", "model.layers.18.mlp.experts.29.up_proj", "model.layers.18.mlp.experts.30.up_proj", "model.layers.18.mlp.experts.31.up_proj", "model.layers.18.mlp.experts.32.up_proj", "model.layers.18.mlp.experts.33.up_proj", "model.layers.18.mlp.experts.34.up_proj", "model.layers.18.mlp.experts.35.up_proj", "model.layers.18.mlp.experts.36.up_proj", "model.layers.18.mlp.experts.37.up_proj", "model.layers.18.mlp.experts.38.up_proj", "model.layers.18.mlp.experts.39.up_proj", "model.layers.18.mlp.experts.40.up_proj", "model.layers.18.mlp.experts.41.up_proj", "model.layers.18.mlp.experts.42.up_proj", "model.layers.18.mlp.experts.43.up_proj", "model.layers.18.mlp.experts.44.up_proj", "model.layers.18.mlp.experts.45.up_proj", "model.layers.18.mlp.experts.46.up_proj", "model.layers.18.mlp.experts.47.up_proj", "model.layers.18.mlp.experts.48.up_proj", "model.layers.18.mlp.experts.49.up_proj", "model.layers.18.mlp.experts.50.up_proj", "model.layers.18.mlp.experts.51.up_proj", "model.layers.18.mlp.experts.52.up_proj", "model.layers.18.mlp.experts.53.up_proj", "model.layers.18.mlp.experts.54.up_proj", "model.layers.18.mlp.experts.55.up_proj", "model.layers.18.mlp.experts.56.up_proj", "model.layers.18.mlp.experts.57.up_proj", "model.layers.18.mlp.experts.58.up_proj", "model.layers.18.mlp.experts.59.up_proj", "model.layers.18.mlp.experts.60.up_proj", "model.layers.18.mlp.experts.61.up_proj", "model.layers.18.mlp.experts.62.up_proj", "model.layers.18.mlp.experts.63.up_proj", "model.layers.18.mlp.experts.64.up_proj", "model.layers.18.mlp.experts.65.up_proj", "model.layers.18.mlp.experts.66.up_proj", "model.layers.18.mlp.experts.67.up_proj", "model.layers.18.mlp.experts.68.up_proj", "model.layers.18.mlp.experts.69.up_proj", "model.layers.18.mlp.experts.70.up_proj", "model.layers.18.mlp.experts.71.up_proj", "model.layers.18.mlp.experts.72.up_proj", "model.layers.18.mlp.experts.73.up_proj", "model.layers.18.mlp.experts.74.up_proj", "model.layers.18.mlp.experts.75.up_proj", "model.layers.18.mlp.experts.76.up_proj", "model.layers.18.mlp.experts.77.up_proj", "model.layers.18.mlp.experts.78.up_proj", "model.layers.18.mlp.experts.79.up_proj", "model.layers.18.mlp.experts.80.up_proj", "model.layers.18.mlp.experts.81.up_proj", "model.layers.18.mlp.experts.82.up_proj", "model.layers.18.mlp.experts.83.up_proj", "model.layers.18.mlp.experts.84.up_proj", "model.layers.18.mlp.experts.85.up_proj", "model.layers.18.mlp.experts.86.up_proj", "model.layers.18.mlp.experts.87.up_proj", "model.layers.18.mlp.experts.88.up_proj", "model.layers.18.mlp.experts.89.up_proj", "model.layers.18.mlp.experts.90.up_proj", "model.layers.18.mlp.experts.91.up_proj", "model.layers.18.mlp.experts.92.up_proj", "model.layers.18.mlp.experts.93.up_proj", "model.layers.18.mlp.experts.94.up_proj", "model.layers.18.mlp.experts.95.up_proj", "model.layers.18.mlp.experts.96.up_proj", "model.layers.18.mlp.experts.97.up_proj", "model.layers.18.mlp.experts.98.up_proj", "model.layers.18.mlp.experts.99.up_proj", "model.layers.18.mlp.experts.100.up_proj", "model.layers.18.mlp.experts.101.up_proj", "model.layers.18.mlp.experts.102.up_proj", "model.layers.18.mlp.experts.103.up_proj", "model.layers.18.mlp.experts.104.up_proj", "model.layers.18.mlp.experts.105.up_proj", "model.layers.18.mlp.experts.106.up_proj", "model.layers.18.mlp.experts.107.up_proj", "model.layers.18.mlp.experts.108.up_proj", "model.layers.18.mlp.experts.109.up_proj", "model.layers.18.mlp.experts.110.up_proj", "model.layers.18.mlp.experts.111.up_proj", "model.layers.18.mlp.experts.112.up_proj", "model.layers.18.mlp.experts.113.up_proj", "model.layers.18.mlp.experts.114.up_proj", "model.layers.18.mlp.experts.115.up_proj", "model.layers.18.mlp.experts.116.up_proj", "model.layers.18.mlp.experts.117.up_proj", "model.layers.18.mlp.experts.118.up_proj", "model.layers.18.mlp.experts.119.up_proj", "model.layers.18.mlp.experts.120.up_proj", "model.layers.18.mlp.experts.121.up_proj", "model.layers.18.mlp.experts.122.up_proj", "model.layers.18.mlp.experts.123.up_proj", "model.layers.18.mlp.experts.124.up_proj", "model.layers.18.mlp.experts.125.up_proj", "model.layers.18.mlp.experts.126.up_proj", "model.layers.18.mlp.experts.127.up_proj", "model.layers.18.mlp.experts.128.up_proj", "model.layers.18.mlp.experts.129.up_proj", "model.layers.18.mlp.experts.130.up_proj", "model.layers.18.mlp.experts.131.up_proj", "model.layers.18.mlp.experts.132.up_proj", "model.layers.18.mlp.experts.133.up_proj", "model.layers.18.mlp.experts.134.up_proj", "model.layers.18.mlp.experts.135.up_proj", "model.layers.18.mlp.experts.136.up_proj", "model.layers.18.mlp.experts.137.up_proj", "model.layers.18.mlp.experts.138.up_proj", "model.layers.18.mlp.experts.139.up_proj", "model.layers.18.mlp.experts.140.up_proj", "model.layers.18.mlp.experts.141.up_proj", "model.layers.18.mlp.experts.142.up_proj", "model.layers.18.mlp.experts.143.up_proj", "model.layers.18.mlp.experts.144.up_proj", "model.layers.18.mlp.experts.145.up_proj", "model.layers.18.mlp.experts.146.up_proj", "model.layers.18.mlp.experts.147.up_proj", "model.layers.18.mlp.experts.148.up_proj", "model.layers.18.mlp.experts.149.up_proj", "model.layers.18.mlp.experts.150.up_proj", "model.layers.18.mlp.experts.151.up_proj", "model.layers.18.mlp.experts.152.up_proj", "model.layers.18.mlp.experts.153.up_proj", "model.layers.18.mlp.experts.154.up_proj", "model.layers.18.mlp.experts.155.up_proj", "model.layers.18.mlp.experts.156.up_proj", "model.layers.18.mlp.experts.157.up_proj", "model.layers.18.mlp.experts.158.up_proj", "model.layers.18.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -8.151482325047255e-05, "dbits": 2516582400 }, { "dkld": -4.457980394363334e-05, "dbits": 5033164800 } ] }, { "idx": 110, "layers": [ "model.layers.18.mlp.experts.0.down_proj", "model.layers.18.mlp.experts.1.down_proj", "model.layers.18.mlp.experts.2.down_proj", "model.layers.18.mlp.experts.3.down_proj", "model.layers.18.mlp.experts.4.down_proj", "model.layers.18.mlp.experts.5.down_proj", "model.layers.18.mlp.experts.6.down_proj", "model.layers.18.mlp.experts.7.down_proj", "model.layers.18.mlp.experts.8.down_proj", "model.layers.18.mlp.experts.9.down_proj", "model.layers.18.mlp.experts.10.down_proj", "model.layers.18.mlp.experts.11.down_proj", "model.layers.18.mlp.experts.12.down_proj", "model.layers.18.mlp.experts.13.down_proj", "model.layers.18.mlp.experts.14.down_proj", "model.layers.18.mlp.experts.15.down_proj", "model.layers.18.mlp.experts.16.down_proj", "model.layers.18.mlp.experts.17.down_proj", "model.layers.18.mlp.experts.18.down_proj", "model.layers.18.mlp.experts.19.down_proj", "model.layers.18.mlp.experts.20.down_proj", "model.layers.18.mlp.experts.21.down_proj", "model.layers.18.mlp.experts.22.down_proj", "model.layers.18.mlp.experts.23.down_proj", "model.layers.18.mlp.experts.24.down_proj", "model.layers.18.mlp.experts.25.down_proj", "model.layers.18.mlp.experts.26.down_proj", "model.layers.18.mlp.experts.27.down_proj", "model.layers.18.mlp.experts.28.down_proj", "model.layers.18.mlp.experts.29.down_proj", "model.layers.18.mlp.experts.30.down_proj", "model.layers.18.mlp.experts.31.down_proj", "model.layers.18.mlp.experts.32.down_proj", "model.layers.18.mlp.experts.33.down_proj", "model.layers.18.mlp.experts.34.down_proj", "model.layers.18.mlp.experts.35.down_proj", "model.layers.18.mlp.experts.36.down_proj", "model.layers.18.mlp.experts.37.down_proj", "model.layers.18.mlp.experts.38.down_proj", "model.layers.18.mlp.experts.39.down_proj", "model.layers.18.mlp.experts.40.down_proj", "model.layers.18.mlp.experts.41.down_proj", "model.layers.18.mlp.experts.42.down_proj", "model.layers.18.mlp.experts.43.down_proj", "model.layers.18.mlp.experts.44.down_proj", "model.layers.18.mlp.experts.45.down_proj", "model.layers.18.mlp.experts.46.down_proj", "model.layers.18.mlp.experts.47.down_proj", "model.layers.18.mlp.experts.48.down_proj", "model.layers.18.mlp.experts.49.down_proj", "model.layers.18.mlp.experts.50.down_proj", "model.layers.18.mlp.experts.51.down_proj", "model.layers.18.mlp.experts.52.down_proj", "model.layers.18.mlp.experts.53.down_proj", "model.layers.18.mlp.experts.54.down_proj", "model.layers.18.mlp.experts.55.down_proj", "model.layers.18.mlp.experts.56.down_proj", "model.layers.18.mlp.experts.57.down_proj", "model.layers.18.mlp.experts.58.down_proj", "model.layers.18.mlp.experts.59.down_proj", "model.layers.18.mlp.experts.60.down_proj", "model.layers.18.mlp.experts.61.down_proj", "model.layers.18.mlp.experts.62.down_proj", "model.layers.18.mlp.experts.63.down_proj", "model.layers.18.mlp.experts.64.down_proj", "model.layers.18.mlp.experts.65.down_proj", "model.layers.18.mlp.experts.66.down_proj", "model.layers.18.mlp.experts.67.down_proj", "model.layers.18.mlp.experts.68.down_proj", "model.layers.18.mlp.experts.69.down_proj", "model.layers.18.mlp.experts.70.down_proj", "model.layers.18.mlp.experts.71.down_proj", "model.layers.18.mlp.experts.72.down_proj", "model.layers.18.mlp.experts.73.down_proj", "model.layers.18.mlp.experts.74.down_proj", "model.layers.18.mlp.experts.75.down_proj", "model.layers.18.mlp.experts.76.down_proj", "model.layers.18.mlp.experts.77.down_proj", "model.layers.18.mlp.experts.78.down_proj", "model.layers.18.mlp.experts.79.down_proj", "model.layers.18.mlp.experts.80.down_proj", "model.layers.18.mlp.experts.81.down_proj", "model.layers.18.mlp.experts.82.down_proj", "model.layers.18.mlp.experts.83.down_proj", "model.layers.18.mlp.experts.84.down_proj", "model.layers.18.mlp.experts.85.down_proj", "model.layers.18.mlp.experts.86.down_proj", "model.layers.18.mlp.experts.87.down_proj", "model.layers.18.mlp.experts.88.down_proj", "model.layers.18.mlp.experts.89.down_proj", "model.layers.18.mlp.experts.90.down_proj", "model.layers.18.mlp.experts.91.down_proj", "model.layers.18.mlp.experts.92.down_proj", "model.layers.18.mlp.experts.93.down_proj", "model.layers.18.mlp.experts.94.down_proj", "model.layers.18.mlp.experts.95.down_proj", "model.layers.18.mlp.experts.96.down_proj", "model.layers.18.mlp.experts.97.down_proj", "model.layers.18.mlp.experts.98.down_proj", "model.layers.18.mlp.experts.99.down_proj", "model.layers.18.mlp.experts.100.down_proj", "model.layers.18.mlp.experts.101.down_proj", "model.layers.18.mlp.experts.102.down_proj", "model.layers.18.mlp.experts.103.down_proj", "model.layers.18.mlp.experts.104.down_proj", "model.layers.18.mlp.experts.105.down_proj", "model.layers.18.mlp.experts.106.down_proj", "model.layers.18.mlp.experts.107.down_proj", "model.layers.18.mlp.experts.108.down_proj", "model.layers.18.mlp.experts.109.down_proj", "model.layers.18.mlp.experts.110.down_proj", "model.layers.18.mlp.experts.111.down_proj", "model.layers.18.mlp.experts.112.down_proj", "model.layers.18.mlp.experts.113.down_proj", "model.layers.18.mlp.experts.114.down_proj", "model.layers.18.mlp.experts.115.down_proj", "model.layers.18.mlp.experts.116.down_proj", "model.layers.18.mlp.experts.117.down_proj", "model.layers.18.mlp.experts.118.down_proj", "model.layers.18.mlp.experts.119.down_proj", "model.layers.18.mlp.experts.120.down_proj", "model.layers.18.mlp.experts.121.down_proj", "model.layers.18.mlp.experts.122.down_proj", "model.layers.18.mlp.experts.123.down_proj", "model.layers.18.mlp.experts.124.down_proj", "model.layers.18.mlp.experts.125.down_proj", "model.layers.18.mlp.experts.126.down_proj", "model.layers.18.mlp.experts.127.down_proj", "model.layers.18.mlp.experts.128.down_proj", "model.layers.18.mlp.experts.129.down_proj", "model.layers.18.mlp.experts.130.down_proj", "model.layers.18.mlp.experts.131.down_proj", "model.layers.18.mlp.experts.132.down_proj", "model.layers.18.mlp.experts.133.down_proj", "model.layers.18.mlp.experts.134.down_proj", "model.layers.18.mlp.experts.135.down_proj", "model.layers.18.mlp.experts.136.down_proj", "model.layers.18.mlp.experts.137.down_proj", "model.layers.18.mlp.experts.138.down_proj", "model.layers.18.mlp.experts.139.down_proj", "model.layers.18.mlp.experts.140.down_proj", "model.layers.18.mlp.experts.141.down_proj", "model.layers.18.mlp.experts.142.down_proj", "model.layers.18.mlp.experts.143.down_proj", "model.layers.18.mlp.experts.144.down_proj", "model.layers.18.mlp.experts.145.down_proj", "model.layers.18.mlp.experts.146.down_proj", "model.layers.18.mlp.experts.147.down_proj", "model.layers.18.mlp.experts.148.down_proj", "model.layers.18.mlp.experts.149.down_proj", "model.layers.18.mlp.experts.150.down_proj", "model.layers.18.mlp.experts.151.down_proj", "model.layers.18.mlp.experts.152.down_proj", "model.layers.18.mlp.experts.153.down_proj", "model.layers.18.mlp.experts.154.down_proj", "model.layers.18.mlp.experts.155.down_proj", "model.layers.18.mlp.experts.156.down_proj", "model.layers.18.mlp.experts.157.down_proj", "model.layers.18.mlp.experts.158.down_proj", "model.layers.18.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.2371870949863694e-05, "dbits": 1258291200 }, { "dkld": -9.437007829546894e-05, "dbits": 2516582400 } ] }, { "idx": 111, "layers": [ "model.layers.19.self_attn.q_proj" ], "candidates": [ { "dkld": -5.4739462211727055e-05, "dbits": 62914560 }, { "dkld": -5.4339878261089325e-05, "dbits": 125829120 } ] }, { "idx": 112, "layers": [ "model.layers.19.self_attn.k_proj", "model.layers.19.self_attn.v_proj" ], "candidates": [ { "dkld": -1.1081341654058802e-06, "dbits": 10485760 }, { "dkld": -7.02819088473916e-05, "dbits": 20971520 } ] }, { "idx": 113, "layers": [ "model.layers.19.self_attn.o_proj" ], "candidates": [ { "dkld": -5.546812899410655e-05, "dbits": 62914560 }, { "dkld": -4.876132588833501e-05, "dbits": 125829120 } ] }, { "idx": 114, "layers": [ "model.layers.19.mlp.shared_experts.gate_proj", "model.layers.19.mlp.shared_experts.up_proj", "model.layers.19.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 0.0002007071860134612, "dbits": 23592960 }, { "dkld": 0.0002014078665524728, "dbits": 47185920 } ] }, { "idx": 115, "layers": [ "model.layers.19.mlp.experts.0.gate_proj", "model.layers.19.mlp.experts.1.gate_proj", "model.layers.19.mlp.experts.2.gate_proj", "model.layers.19.mlp.experts.3.gate_proj", "model.layers.19.mlp.experts.4.gate_proj", "model.layers.19.mlp.experts.5.gate_proj", "model.layers.19.mlp.experts.6.gate_proj", "model.layers.19.mlp.experts.7.gate_proj", "model.layers.19.mlp.experts.8.gate_proj", "model.layers.19.mlp.experts.9.gate_proj", "model.layers.19.mlp.experts.10.gate_proj", "model.layers.19.mlp.experts.11.gate_proj", "model.layers.19.mlp.experts.12.gate_proj", "model.layers.19.mlp.experts.13.gate_proj", "model.layers.19.mlp.experts.14.gate_proj", "model.layers.19.mlp.experts.15.gate_proj", "model.layers.19.mlp.experts.16.gate_proj", "model.layers.19.mlp.experts.17.gate_proj", "model.layers.19.mlp.experts.18.gate_proj", "model.layers.19.mlp.experts.19.gate_proj", "model.layers.19.mlp.experts.20.gate_proj", "model.layers.19.mlp.experts.21.gate_proj", "model.layers.19.mlp.experts.22.gate_proj", "model.layers.19.mlp.experts.23.gate_proj", "model.layers.19.mlp.experts.24.gate_proj", "model.layers.19.mlp.experts.25.gate_proj", "model.layers.19.mlp.experts.26.gate_proj", "model.layers.19.mlp.experts.27.gate_proj", "model.layers.19.mlp.experts.28.gate_proj", "model.layers.19.mlp.experts.29.gate_proj", "model.layers.19.mlp.experts.30.gate_proj", "model.layers.19.mlp.experts.31.gate_proj", "model.layers.19.mlp.experts.32.gate_proj", "model.layers.19.mlp.experts.33.gate_proj", "model.layers.19.mlp.experts.34.gate_proj", "model.layers.19.mlp.experts.35.gate_proj", "model.layers.19.mlp.experts.36.gate_proj", "model.layers.19.mlp.experts.37.gate_proj", "model.layers.19.mlp.experts.38.gate_proj", "model.layers.19.mlp.experts.39.gate_proj", "model.layers.19.mlp.experts.40.gate_proj", "model.layers.19.mlp.experts.41.gate_proj", "model.layers.19.mlp.experts.42.gate_proj", "model.layers.19.mlp.experts.43.gate_proj", "model.layers.19.mlp.experts.44.gate_proj", "model.layers.19.mlp.experts.45.gate_proj", "model.layers.19.mlp.experts.46.gate_proj", "model.layers.19.mlp.experts.47.gate_proj", "model.layers.19.mlp.experts.48.gate_proj", "model.layers.19.mlp.experts.49.gate_proj", "model.layers.19.mlp.experts.50.gate_proj", "model.layers.19.mlp.experts.51.gate_proj", "model.layers.19.mlp.experts.52.gate_proj", "model.layers.19.mlp.experts.53.gate_proj", "model.layers.19.mlp.experts.54.gate_proj", "model.layers.19.mlp.experts.55.gate_proj", "model.layers.19.mlp.experts.56.gate_proj", "model.layers.19.mlp.experts.57.gate_proj", "model.layers.19.mlp.experts.58.gate_proj", "model.layers.19.mlp.experts.59.gate_proj", "model.layers.19.mlp.experts.60.gate_proj", "model.layers.19.mlp.experts.61.gate_proj", "model.layers.19.mlp.experts.62.gate_proj", "model.layers.19.mlp.experts.63.gate_proj", "model.layers.19.mlp.experts.64.gate_proj", "model.layers.19.mlp.experts.65.gate_proj", "model.layers.19.mlp.experts.66.gate_proj", "model.layers.19.mlp.experts.67.gate_proj", "model.layers.19.mlp.experts.68.gate_proj", "model.layers.19.mlp.experts.69.gate_proj", "model.layers.19.mlp.experts.70.gate_proj", "model.layers.19.mlp.experts.71.gate_proj", "model.layers.19.mlp.experts.72.gate_proj", "model.layers.19.mlp.experts.73.gate_proj", "model.layers.19.mlp.experts.74.gate_proj", "model.layers.19.mlp.experts.75.gate_proj", "model.layers.19.mlp.experts.76.gate_proj", "model.layers.19.mlp.experts.77.gate_proj", "model.layers.19.mlp.experts.78.gate_proj", "model.layers.19.mlp.experts.79.gate_proj", "model.layers.19.mlp.experts.80.gate_proj", "model.layers.19.mlp.experts.81.gate_proj", "model.layers.19.mlp.experts.82.gate_proj", "model.layers.19.mlp.experts.83.gate_proj", "model.layers.19.mlp.experts.84.gate_proj", "model.layers.19.mlp.experts.85.gate_proj", "model.layers.19.mlp.experts.86.gate_proj", "model.layers.19.mlp.experts.87.gate_proj", "model.layers.19.mlp.experts.88.gate_proj", "model.layers.19.mlp.experts.89.gate_proj", "model.layers.19.mlp.experts.90.gate_proj", "model.layers.19.mlp.experts.91.gate_proj", "model.layers.19.mlp.experts.92.gate_proj", "model.layers.19.mlp.experts.93.gate_proj", "model.layers.19.mlp.experts.94.gate_proj", "model.layers.19.mlp.experts.95.gate_proj", "model.layers.19.mlp.experts.96.gate_proj", "model.layers.19.mlp.experts.97.gate_proj", "model.layers.19.mlp.experts.98.gate_proj", "model.layers.19.mlp.experts.99.gate_proj", "model.layers.19.mlp.experts.100.gate_proj", "model.layers.19.mlp.experts.101.gate_proj", "model.layers.19.mlp.experts.102.gate_proj", "model.layers.19.mlp.experts.103.gate_proj", "model.layers.19.mlp.experts.104.gate_proj", "model.layers.19.mlp.experts.105.gate_proj", "model.layers.19.mlp.experts.106.gate_proj", "model.layers.19.mlp.experts.107.gate_proj", "model.layers.19.mlp.experts.108.gate_proj", "model.layers.19.mlp.experts.109.gate_proj", "model.layers.19.mlp.experts.110.gate_proj", "model.layers.19.mlp.experts.111.gate_proj", "model.layers.19.mlp.experts.112.gate_proj", "model.layers.19.mlp.experts.113.gate_proj", "model.layers.19.mlp.experts.114.gate_proj", "model.layers.19.mlp.experts.115.gate_proj", "model.layers.19.mlp.experts.116.gate_proj", "model.layers.19.mlp.experts.117.gate_proj", "model.layers.19.mlp.experts.118.gate_proj", "model.layers.19.mlp.experts.119.gate_proj", "model.layers.19.mlp.experts.120.gate_proj", "model.layers.19.mlp.experts.121.gate_proj", "model.layers.19.mlp.experts.122.gate_proj", "model.layers.19.mlp.experts.123.gate_proj", "model.layers.19.mlp.experts.124.gate_proj", "model.layers.19.mlp.experts.125.gate_proj", "model.layers.19.mlp.experts.126.gate_proj", "model.layers.19.mlp.experts.127.gate_proj", "model.layers.19.mlp.experts.128.gate_proj", "model.layers.19.mlp.experts.129.gate_proj", "model.layers.19.mlp.experts.130.gate_proj", "model.layers.19.mlp.experts.131.gate_proj", "model.layers.19.mlp.experts.132.gate_proj", "model.layers.19.mlp.experts.133.gate_proj", "model.layers.19.mlp.experts.134.gate_proj", "model.layers.19.mlp.experts.135.gate_proj", "model.layers.19.mlp.experts.136.gate_proj", "model.layers.19.mlp.experts.137.gate_proj", "model.layers.19.mlp.experts.138.gate_proj", "model.layers.19.mlp.experts.139.gate_proj", "model.layers.19.mlp.experts.140.gate_proj", "model.layers.19.mlp.experts.141.gate_proj", "model.layers.19.mlp.experts.142.gate_proj", "model.layers.19.mlp.experts.143.gate_proj", "model.layers.19.mlp.experts.144.gate_proj", "model.layers.19.mlp.experts.145.gate_proj", "model.layers.19.mlp.experts.146.gate_proj", "model.layers.19.mlp.experts.147.gate_proj", "model.layers.19.mlp.experts.148.gate_proj", "model.layers.19.mlp.experts.149.gate_proj", "model.layers.19.mlp.experts.150.gate_proj", "model.layers.19.mlp.experts.151.gate_proj", "model.layers.19.mlp.experts.152.gate_proj", "model.layers.19.mlp.experts.153.gate_proj", "model.layers.19.mlp.experts.154.gate_proj", "model.layers.19.mlp.experts.155.gate_proj", "model.layers.19.mlp.experts.156.gate_proj", "model.layers.19.mlp.experts.157.gate_proj", "model.layers.19.mlp.experts.158.gate_proj", "model.layers.19.mlp.experts.159.gate_proj", "model.layers.19.mlp.experts.0.up_proj", "model.layers.19.mlp.experts.1.up_proj", "model.layers.19.mlp.experts.2.up_proj", "model.layers.19.mlp.experts.3.up_proj", "model.layers.19.mlp.experts.4.up_proj", "model.layers.19.mlp.experts.5.up_proj", "model.layers.19.mlp.experts.6.up_proj", "model.layers.19.mlp.experts.7.up_proj", "model.layers.19.mlp.experts.8.up_proj", "model.layers.19.mlp.experts.9.up_proj", "model.layers.19.mlp.experts.10.up_proj", "model.layers.19.mlp.experts.11.up_proj", "model.layers.19.mlp.experts.12.up_proj", "model.layers.19.mlp.experts.13.up_proj", "model.layers.19.mlp.experts.14.up_proj", "model.layers.19.mlp.experts.15.up_proj", "model.layers.19.mlp.experts.16.up_proj", "model.layers.19.mlp.experts.17.up_proj", "model.layers.19.mlp.experts.18.up_proj", "model.layers.19.mlp.experts.19.up_proj", "model.layers.19.mlp.experts.20.up_proj", "model.layers.19.mlp.experts.21.up_proj", "model.layers.19.mlp.experts.22.up_proj", "model.layers.19.mlp.experts.23.up_proj", "model.layers.19.mlp.experts.24.up_proj", "model.layers.19.mlp.experts.25.up_proj", "model.layers.19.mlp.experts.26.up_proj", "model.layers.19.mlp.experts.27.up_proj", "model.layers.19.mlp.experts.28.up_proj", "model.layers.19.mlp.experts.29.up_proj", "model.layers.19.mlp.experts.30.up_proj", "model.layers.19.mlp.experts.31.up_proj", "model.layers.19.mlp.experts.32.up_proj", "model.layers.19.mlp.experts.33.up_proj", "model.layers.19.mlp.experts.34.up_proj", "model.layers.19.mlp.experts.35.up_proj", "model.layers.19.mlp.experts.36.up_proj", "model.layers.19.mlp.experts.37.up_proj", "model.layers.19.mlp.experts.38.up_proj", "model.layers.19.mlp.experts.39.up_proj", "model.layers.19.mlp.experts.40.up_proj", "model.layers.19.mlp.experts.41.up_proj", "model.layers.19.mlp.experts.42.up_proj", "model.layers.19.mlp.experts.43.up_proj", "model.layers.19.mlp.experts.44.up_proj", "model.layers.19.mlp.experts.45.up_proj", "model.layers.19.mlp.experts.46.up_proj", "model.layers.19.mlp.experts.47.up_proj", "model.layers.19.mlp.experts.48.up_proj", "model.layers.19.mlp.experts.49.up_proj", "model.layers.19.mlp.experts.50.up_proj", "model.layers.19.mlp.experts.51.up_proj", "model.layers.19.mlp.experts.52.up_proj", "model.layers.19.mlp.experts.53.up_proj", "model.layers.19.mlp.experts.54.up_proj", "model.layers.19.mlp.experts.55.up_proj", "model.layers.19.mlp.experts.56.up_proj", "model.layers.19.mlp.experts.57.up_proj", "model.layers.19.mlp.experts.58.up_proj", "model.layers.19.mlp.experts.59.up_proj", "model.layers.19.mlp.experts.60.up_proj", "model.layers.19.mlp.experts.61.up_proj", "model.layers.19.mlp.experts.62.up_proj", "model.layers.19.mlp.experts.63.up_proj", "model.layers.19.mlp.experts.64.up_proj", "model.layers.19.mlp.experts.65.up_proj", "model.layers.19.mlp.experts.66.up_proj", "model.layers.19.mlp.experts.67.up_proj", "model.layers.19.mlp.experts.68.up_proj", "model.layers.19.mlp.experts.69.up_proj", "model.layers.19.mlp.experts.70.up_proj", "model.layers.19.mlp.experts.71.up_proj", "model.layers.19.mlp.experts.72.up_proj", "model.layers.19.mlp.experts.73.up_proj", "model.layers.19.mlp.experts.74.up_proj", "model.layers.19.mlp.experts.75.up_proj", "model.layers.19.mlp.experts.76.up_proj", "model.layers.19.mlp.experts.77.up_proj", "model.layers.19.mlp.experts.78.up_proj", "model.layers.19.mlp.experts.79.up_proj", "model.layers.19.mlp.experts.80.up_proj", "model.layers.19.mlp.experts.81.up_proj", "model.layers.19.mlp.experts.82.up_proj", "model.layers.19.mlp.experts.83.up_proj", "model.layers.19.mlp.experts.84.up_proj", "model.layers.19.mlp.experts.85.up_proj", "model.layers.19.mlp.experts.86.up_proj", "model.layers.19.mlp.experts.87.up_proj", "model.layers.19.mlp.experts.88.up_proj", "model.layers.19.mlp.experts.89.up_proj", "model.layers.19.mlp.experts.90.up_proj", "model.layers.19.mlp.experts.91.up_proj", "model.layers.19.mlp.experts.92.up_proj", "model.layers.19.mlp.experts.93.up_proj", "model.layers.19.mlp.experts.94.up_proj", "model.layers.19.mlp.experts.95.up_proj", "model.layers.19.mlp.experts.96.up_proj", "model.layers.19.mlp.experts.97.up_proj", "model.layers.19.mlp.experts.98.up_proj", "model.layers.19.mlp.experts.99.up_proj", "model.layers.19.mlp.experts.100.up_proj", "model.layers.19.mlp.experts.101.up_proj", "model.layers.19.mlp.experts.102.up_proj", "model.layers.19.mlp.experts.103.up_proj", "model.layers.19.mlp.experts.104.up_proj", "model.layers.19.mlp.experts.105.up_proj", "model.layers.19.mlp.experts.106.up_proj", "model.layers.19.mlp.experts.107.up_proj", "model.layers.19.mlp.experts.108.up_proj", "model.layers.19.mlp.experts.109.up_proj", "model.layers.19.mlp.experts.110.up_proj", "model.layers.19.mlp.experts.111.up_proj", "model.layers.19.mlp.experts.112.up_proj", "model.layers.19.mlp.experts.113.up_proj", "model.layers.19.mlp.experts.114.up_proj", "model.layers.19.mlp.experts.115.up_proj", "model.layers.19.mlp.experts.116.up_proj", "model.layers.19.mlp.experts.117.up_proj", "model.layers.19.mlp.experts.118.up_proj", "model.layers.19.mlp.experts.119.up_proj", "model.layers.19.mlp.experts.120.up_proj", "model.layers.19.mlp.experts.121.up_proj", "model.layers.19.mlp.experts.122.up_proj", "model.layers.19.mlp.experts.123.up_proj", "model.layers.19.mlp.experts.124.up_proj", "model.layers.19.mlp.experts.125.up_proj", "model.layers.19.mlp.experts.126.up_proj", "model.layers.19.mlp.experts.127.up_proj", "model.layers.19.mlp.experts.128.up_proj", "model.layers.19.mlp.experts.129.up_proj", "model.layers.19.mlp.experts.130.up_proj", "model.layers.19.mlp.experts.131.up_proj", "model.layers.19.mlp.experts.132.up_proj", "model.layers.19.mlp.experts.133.up_proj", "model.layers.19.mlp.experts.134.up_proj", "model.layers.19.mlp.experts.135.up_proj", "model.layers.19.mlp.experts.136.up_proj", "model.layers.19.mlp.experts.137.up_proj", "model.layers.19.mlp.experts.138.up_proj", "model.layers.19.mlp.experts.139.up_proj", "model.layers.19.mlp.experts.140.up_proj", "model.layers.19.mlp.experts.141.up_proj", "model.layers.19.mlp.experts.142.up_proj", "model.layers.19.mlp.experts.143.up_proj", "model.layers.19.mlp.experts.144.up_proj", "model.layers.19.mlp.experts.145.up_proj", "model.layers.19.mlp.experts.146.up_proj", "model.layers.19.mlp.experts.147.up_proj", "model.layers.19.mlp.experts.148.up_proj", "model.layers.19.mlp.experts.149.up_proj", "model.layers.19.mlp.experts.150.up_proj", "model.layers.19.mlp.experts.151.up_proj", "model.layers.19.mlp.experts.152.up_proj", "model.layers.19.mlp.experts.153.up_proj", "model.layers.19.mlp.experts.154.up_proj", "model.layers.19.mlp.experts.155.up_proj", "model.layers.19.mlp.experts.156.up_proj", "model.layers.19.mlp.experts.157.up_proj", "model.layers.19.mlp.experts.158.up_proj", "model.layers.19.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -6.799313705414464e-05, "dbits": 2516582400 }, { "dkld": -6.95705413818349e-05, "dbits": 5033164800 } ] }, { "idx": 116, "layers": [ "model.layers.19.mlp.experts.0.down_proj", "model.layers.19.mlp.experts.1.down_proj", "model.layers.19.mlp.experts.2.down_proj", "model.layers.19.mlp.experts.3.down_proj", "model.layers.19.mlp.experts.4.down_proj", "model.layers.19.mlp.experts.5.down_proj", "model.layers.19.mlp.experts.6.down_proj", "model.layers.19.mlp.experts.7.down_proj", "model.layers.19.mlp.experts.8.down_proj", "model.layers.19.mlp.experts.9.down_proj", "model.layers.19.mlp.experts.10.down_proj", "model.layers.19.mlp.experts.11.down_proj", "model.layers.19.mlp.experts.12.down_proj", "model.layers.19.mlp.experts.13.down_proj", "model.layers.19.mlp.experts.14.down_proj", "model.layers.19.mlp.experts.15.down_proj", "model.layers.19.mlp.experts.16.down_proj", "model.layers.19.mlp.experts.17.down_proj", "model.layers.19.mlp.experts.18.down_proj", "model.layers.19.mlp.experts.19.down_proj", "model.layers.19.mlp.experts.20.down_proj", "model.layers.19.mlp.experts.21.down_proj", "model.layers.19.mlp.experts.22.down_proj", "model.layers.19.mlp.experts.23.down_proj", "model.layers.19.mlp.experts.24.down_proj", "model.layers.19.mlp.experts.25.down_proj", "model.layers.19.mlp.experts.26.down_proj", "model.layers.19.mlp.experts.27.down_proj", "model.layers.19.mlp.experts.28.down_proj", "model.layers.19.mlp.experts.29.down_proj", "model.layers.19.mlp.experts.30.down_proj", "model.layers.19.mlp.experts.31.down_proj", "model.layers.19.mlp.experts.32.down_proj", "model.layers.19.mlp.experts.33.down_proj", "model.layers.19.mlp.experts.34.down_proj", "model.layers.19.mlp.experts.35.down_proj", "model.layers.19.mlp.experts.36.down_proj", "model.layers.19.mlp.experts.37.down_proj", "model.layers.19.mlp.experts.38.down_proj", "model.layers.19.mlp.experts.39.down_proj", "model.layers.19.mlp.experts.40.down_proj", "model.layers.19.mlp.experts.41.down_proj", "model.layers.19.mlp.experts.42.down_proj", "model.layers.19.mlp.experts.43.down_proj", "model.layers.19.mlp.experts.44.down_proj", "model.layers.19.mlp.experts.45.down_proj", "model.layers.19.mlp.experts.46.down_proj", "model.layers.19.mlp.experts.47.down_proj", "model.layers.19.mlp.experts.48.down_proj", "model.layers.19.mlp.experts.49.down_proj", "model.layers.19.mlp.experts.50.down_proj", "model.layers.19.mlp.experts.51.down_proj", "model.layers.19.mlp.experts.52.down_proj", "model.layers.19.mlp.experts.53.down_proj", "model.layers.19.mlp.experts.54.down_proj", "model.layers.19.mlp.experts.55.down_proj", "model.layers.19.mlp.experts.56.down_proj", "model.layers.19.mlp.experts.57.down_proj", "model.layers.19.mlp.experts.58.down_proj", "model.layers.19.mlp.experts.59.down_proj", "model.layers.19.mlp.experts.60.down_proj", "model.layers.19.mlp.experts.61.down_proj", "model.layers.19.mlp.experts.62.down_proj", "model.layers.19.mlp.experts.63.down_proj", "model.layers.19.mlp.experts.64.down_proj", "model.layers.19.mlp.experts.65.down_proj", "model.layers.19.mlp.experts.66.down_proj", "model.layers.19.mlp.experts.67.down_proj", "model.layers.19.mlp.experts.68.down_proj", "model.layers.19.mlp.experts.69.down_proj", "model.layers.19.mlp.experts.70.down_proj", "model.layers.19.mlp.experts.71.down_proj", "model.layers.19.mlp.experts.72.down_proj", "model.layers.19.mlp.experts.73.down_proj", "model.layers.19.mlp.experts.74.down_proj", "model.layers.19.mlp.experts.75.down_proj", "model.layers.19.mlp.experts.76.down_proj", "model.layers.19.mlp.experts.77.down_proj", "model.layers.19.mlp.experts.78.down_proj", "model.layers.19.mlp.experts.79.down_proj", "model.layers.19.mlp.experts.80.down_proj", "model.layers.19.mlp.experts.81.down_proj", "model.layers.19.mlp.experts.82.down_proj", "model.layers.19.mlp.experts.83.down_proj", "model.layers.19.mlp.experts.84.down_proj", "model.layers.19.mlp.experts.85.down_proj", "model.layers.19.mlp.experts.86.down_proj", "model.layers.19.mlp.experts.87.down_proj", "model.layers.19.mlp.experts.88.down_proj", "model.layers.19.mlp.experts.89.down_proj", "model.layers.19.mlp.experts.90.down_proj", "model.layers.19.mlp.experts.91.down_proj", "model.layers.19.mlp.experts.92.down_proj", "model.layers.19.mlp.experts.93.down_proj", "model.layers.19.mlp.experts.94.down_proj", "model.layers.19.mlp.experts.95.down_proj", "model.layers.19.mlp.experts.96.down_proj", "model.layers.19.mlp.experts.97.down_proj", "model.layers.19.mlp.experts.98.down_proj", "model.layers.19.mlp.experts.99.down_proj", "model.layers.19.mlp.experts.100.down_proj", "model.layers.19.mlp.experts.101.down_proj", "model.layers.19.mlp.experts.102.down_proj", "model.layers.19.mlp.experts.103.down_proj", "model.layers.19.mlp.experts.104.down_proj", "model.layers.19.mlp.experts.105.down_proj", "model.layers.19.mlp.experts.106.down_proj", "model.layers.19.mlp.experts.107.down_proj", "model.layers.19.mlp.experts.108.down_proj", "model.layers.19.mlp.experts.109.down_proj", "model.layers.19.mlp.experts.110.down_proj", "model.layers.19.mlp.experts.111.down_proj", "model.layers.19.mlp.experts.112.down_proj", "model.layers.19.mlp.experts.113.down_proj", "model.layers.19.mlp.experts.114.down_proj", "model.layers.19.mlp.experts.115.down_proj", "model.layers.19.mlp.experts.116.down_proj", "model.layers.19.mlp.experts.117.down_proj", "model.layers.19.mlp.experts.118.down_proj", "model.layers.19.mlp.experts.119.down_proj", "model.layers.19.mlp.experts.120.down_proj", "model.layers.19.mlp.experts.121.down_proj", "model.layers.19.mlp.experts.122.down_proj", "model.layers.19.mlp.experts.123.down_proj", "model.layers.19.mlp.experts.124.down_proj", "model.layers.19.mlp.experts.125.down_proj", "model.layers.19.mlp.experts.126.down_proj", "model.layers.19.mlp.experts.127.down_proj", "model.layers.19.mlp.experts.128.down_proj", "model.layers.19.mlp.experts.129.down_proj", "model.layers.19.mlp.experts.130.down_proj", "model.layers.19.mlp.experts.131.down_proj", "model.layers.19.mlp.experts.132.down_proj", "model.layers.19.mlp.experts.133.down_proj", "model.layers.19.mlp.experts.134.down_proj", "model.layers.19.mlp.experts.135.down_proj", "model.layers.19.mlp.experts.136.down_proj", "model.layers.19.mlp.experts.137.down_proj", "model.layers.19.mlp.experts.138.down_proj", "model.layers.19.mlp.experts.139.down_proj", "model.layers.19.mlp.experts.140.down_proj", "model.layers.19.mlp.experts.141.down_proj", "model.layers.19.mlp.experts.142.down_proj", "model.layers.19.mlp.experts.143.down_proj", "model.layers.19.mlp.experts.144.down_proj", "model.layers.19.mlp.experts.145.down_proj", "model.layers.19.mlp.experts.146.down_proj", "model.layers.19.mlp.experts.147.down_proj", "model.layers.19.mlp.experts.148.down_proj", "model.layers.19.mlp.experts.149.down_proj", "model.layers.19.mlp.experts.150.down_proj", "model.layers.19.mlp.experts.151.down_proj", "model.layers.19.mlp.experts.152.down_proj", "model.layers.19.mlp.experts.153.down_proj", "model.layers.19.mlp.experts.154.down_proj", "model.layers.19.mlp.experts.155.down_proj", "model.layers.19.mlp.experts.156.down_proj", "model.layers.19.mlp.experts.157.down_proj", "model.layers.19.mlp.experts.158.down_proj", "model.layers.19.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.4184095673262726e-05, "dbits": 1258291200 }, { "dkld": -6.127962842583656e-05, "dbits": 2516582400 } ] }, { "idx": 117, "layers": [ "model.layers.20.self_attn.q_proj" ], "candidates": [ { "dkld": 1.7753615975380638e-05, "dbits": 62914560 }, { "dkld": 2.2864714264870384e-05, "dbits": 125829120 } ] }, { "idx": 118, "layers": [ "model.layers.20.self_attn.k_proj", "model.layers.20.self_attn.v_proj" ], "candidates": [ { "dkld": -9.021586738526717e-05, "dbits": 10485760 }, { "dkld": -3.4531997516750595e-05, "dbits": 20971520 } ] }, { "idx": 119, "layers": [ "model.layers.20.self_attn.o_proj" ], "candidates": [ { "dkld": -0.0002573053818196048, "dbits": 62914560 }, { "dkld": -0.00019657644443213905, "dbits": 125829120 } ] }, { "idx": 120, "layers": [ "model.layers.20.mlp.shared_experts.gate_proj", "model.layers.20.mlp.shared_experts.up_proj", "model.layers.20.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00023248274810612132, "dbits": 23592960 }, { "dkld": -0.00026599431876093114, "dbits": 47185920 } ] }, { "idx": 121, "layers": [ "model.layers.20.mlp.experts.0.gate_proj", "model.layers.20.mlp.experts.1.gate_proj", "model.layers.20.mlp.experts.2.gate_proj", "model.layers.20.mlp.experts.3.gate_proj", "model.layers.20.mlp.experts.4.gate_proj", "model.layers.20.mlp.experts.5.gate_proj", "model.layers.20.mlp.experts.6.gate_proj", "model.layers.20.mlp.experts.7.gate_proj", "model.layers.20.mlp.experts.8.gate_proj", "model.layers.20.mlp.experts.9.gate_proj", "model.layers.20.mlp.experts.10.gate_proj", "model.layers.20.mlp.experts.11.gate_proj", "model.layers.20.mlp.experts.12.gate_proj", "model.layers.20.mlp.experts.13.gate_proj", "model.layers.20.mlp.experts.14.gate_proj", "model.layers.20.mlp.experts.15.gate_proj", "model.layers.20.mlp.experts.16.gate_proj", "model.layers.20.mlp.experts.17.gate_proj", "model.layers.20.mlp.experts.18.gate_proj", "model.layers.20.mlp.experts.19.gate_proj", "model.layers.20.mlp.experts.20.gate_proj", "model.layers.20.mlp.experts.21.gate_proj", "model.layers.20.mlp.experts.22.gate_proj", "model.layers.20.mlp.experts.23.gate_proj", "model.layers.20.mlp.experts.24.gate_proj", "model.layers.20.mlp.experts.25.gate_proj", "model.layers.20.mlp.experts.26.gate_proj", "model.layers.20.mlp.experts.27.gate_proj", "model.layers.20.mlp.experts.28.gate_proj", "model.layers.20.mlp.experts.29.gate_proj", "model.layers.20.mlp.experts.30.gate_proj", "model.layers.20.mlp.experts.31.gate_proj", "model.layers.20.mlp.experts.32.gate_proj", "model.layers.20.mlp.experts.33.gate_proj", "model.layers.20.mlp.experts.34.gate_proj", "model.layers.20.mlp.experts.35.gate_proj", "model.layers.20.mlp.experts.36.gate_proj", "model.layers.20.mlp.experts.37.gate_proj", "model.layers.20.mlp.experts.38.gate_proj", "model.layers.20.mlp.experts.39.gate_proj", "model.layers.20.mlp.experts.40.gate_proj", "model.layers.20.mlp.experts.41.gate_proj", "model.layers.20.mlp.experts.42.gate_proj", "model.layers.20.mlp.experts.43.gate_proj", "model.layers.20.mlp.experts.44.gate_proj", "model.layers.20.mlp.experts.45.gate_proj", "model.layers.20.mlp.experts.46.gate_proj", "model.layers.20.mlp.experts.47.gate_proj", "model.layers.20.mlp.experts.48.gate_proj", "model.layers.20.mlp.experts.49.gate_proj", "model.layers.20.mlp.experts.50.gate_proj", "model.layers.20.mlp.experts.51.gate_proj", "model.layers.20.mlp.experts.52.gate_proj", "model.layers.20.mlp.experts.53.gate_proj", "model.layers.20.mlp.experts.54.gate_proj", "model.layers.20.mlp.experts.55.gate_proj", "model.layers.20.mlp.experts.56.gate_proj", "model.layers.20.mlp.experts.57.gate_proj", "model.layers.20.mlp.experts.58.gate_proj", "model.layers.20.mlp.experts.59.gate_proj", "model.layers.20.mlp.experts.60.gate_proj", "model.layers.20.mlp.experts.61.gate_proj", "model.layers.20.mlp.experts.62.gate_proj", "model.layers.20.mlp.experts.63.gate_proj", "model.layers.20.mlp.experts.64.gate_proj", "model.layers.20.mlp.experts.65.gate_proj", "model.layers.20.mlp.experts.66.gate_proj", "model.layers.20.mlp.experts.67.gate_proj", "model.layers.20.mlp.experts.68.gate_proj", "model.layers.20.mlp.experts.69.gate_proj", "model.layers.20.mlp.experts.70.gate_proj", "model.layers.20.mlp.experts.71.gate_proj", "model.layers.20.mlp.experts.72.gate_proj", "model.layers.20.mlp.experts.73.gate_proj", "model.layers.20.mlp.experts.74.gate_proj", "model.layers.20.mlp.experts.75.gate_proj", "model.layers.20.mlp.experts.76.gate_proj", "model.layers.20.mlp.experts.77.gate_proj", "model.layers.20.mlp.experts.78.gate_proj", "model.layers.20.mlp.experts.79.gate_proj", "model.layers.20.mlp.experts.80.gate_proj", "model.layers.20.mlp.experts.81.gate_proj", "model.layers.20.mlp.experts.82.gate_proj", "model.layers.20.mlp.experts.83.gate_proj", "model.layers.20.mlp.experts.84.gate_proj", "model.layers.20.mlp.experts.85.gate_proj", "model.layers.20.mlp.experts.86.gate_proj", "model.layers.20.mlp.experts.87.gate_proj", "model.layers.20.mlp.experts.88.gate_proj", "model.layers.20.mlp.experts.89.gate_proj", "model.layers.20.mlp.experts.90.gate_proj", "model.layers.20.mlp.experts.91.gate_proj", "model.layers.20.mlp.experts.92.gate_proj", "model.layers.20.mlp.experts.93.gate_proj", "model.layers.20.mlp.experts.94.gate_proj", "model.layers.20.mlp.experts.95.gate_proj", "model.layers.20.mlp.experts.96.gate_proj", "model.layers.20.mlp.experts.97.gate_proj", "model.layers.20.mlp.experts.98.gate_proj", "model.layers.20.mlp.experts.99.gate_proj", "model.layers.20.mlp.experts.100.gate_proj", "model.layers.20.mlp.experts.101.gate_proj", "model.layers.20.mlp.experts.102.gate_proj", "model.layers.20.mlp.experts.103.gate_proj", "model.layers.20.mlp.experts.104.gate_proj", "model.layers.20.mlp.experts.105.gate_proj", "model.layers.20.mlp.experts.106.gate_proj", "model.layers.20.mlp.experts.107.gate_proj", "model.layers.20.mlp.experts.108.gate_proj", "model.layers.20.mlp.experts.109.gate_proj", "model.layers.20.mlp.experts.110.gate_proj", "model.layers.20.mlp.experts.111.gate_proj", "model.layers.20.mlp.experts.112.gate_proj", "model.layers.20.mlp.experts.113.gate_proj", "model.layers.20.mlp.experts.114.gate_proj", "model.layers.20.mlp.experts.115.gate_proj", "model.layers.20.mlp.experts.116.gate_proj", "model.layers.20.mlp.experts.117.gate_proj", "model.layers.20.mlp.experts.118.gate_proj", "model.layers.20.mlp.experts.119.gate_proj", "model.layers.20.mlp.experts.120.gate_proj", "model.layers.20.mlp.experts.121.gate_proj", "model.layers.20.mlp.experts.122.gate_proj", "model.layers.20.mlp.experts.123.gate_proj", "model.layers.20.mlp.experts.124.gate_proj", "model.layers.20.mlp.experts.125.gate_proj", "model.layers.20.mlp.experts.126.gate_proj", "model.layers.20.mlp.experts.127.gate_proj", "model.layers.20.mlp.experts.128.gate_proj", "model.layers.20.mlp.experts.129.gate_proj", "model.layers.20.mlp.experts.130.gate_proj", "model.layers.20.mlp.experts.131.gate_proj", "model.layers.20.mlp.experts.132.gate_proj", "model.layers.20.mlp.experts.133.gate_proj", "model.layers.20.mlp.experts.134.gate_proj", "model.layers.20.mlp.experts.135.gate_proj", "model.layers.20.mlp.experts.136.gate_proj", "model.layers.20.mlp.experts.137.gate_proj", "model.layers.20.mlp.experts.138.gate_proj", "model.layers.20.mlp.experts.139.gate_proj", "model.layers.20.mlp.experts.140.gate_proj", "model.layers.20.mlp.experts.141.gate_proj", "model.layers.20.mlp.experts.142.gate_proj", "model.layers.20.mlp.experts.143.gate_proj", "model.layers.20.mlp.experts.144.gate_proj", "model.layers.20.mlp.experts.145.gate_proj", "model.layers.20.mlp.experts.146.gate_proj", "model.layers.20.mlp.experts.147.gate_proj", "model.layers.20.mlp.experts.148.gate_proj", "model.layers.20.mlp.experts.149.gate_proj", "model.layers.20.mlp.experts.150.gate_proj", "model.layers.20.mlp.experts.151.gate_proj", "model.layers.20.mlp.experts.152.gate_proj", "model.layers.20.mlp.experts.153.gate_proj", "model.layers.20.mlp.experts.154.gate_proj", "model.layers.20.mlp.experts.155.gate_proj", "model.layers.20.mlp.experts.156.gate_proj", "model.layers.20.mlp.experts.157.gate_proj", "model.layers.20.mlp.experts.158.gate_proj", "model.layers.20.mlp.experts.159.gate_proj", "model.layers.20.mlp.experts.0.up_proj", "model.layers.20.mlp.experts.1.up_proj", "model.layers.20.mlp.experts.2.up_proj", "model.layers.20.mlp.experts.3.up_proj", "model.layers.20.mlp.experts.4.up_proj", "model.layers.20.mlp.experts.5.up_proj", "model.layers.20.mlp.experts.6.up_proj", "model.layers.20.mlp.experts.7.up_proj", "model.layers.20.mlp.experts.8.up_proj", "model.layers.20.mlp.experts.9.up_proj", "model.layers.20.mlp.experts.10.up_proj", "model.layers.20.mlp.experts.11.up_proj", "model.layers.20.mlp.experts.12.up_proj", "model.layers.20.mlp.experts.13.up_proj", "model.layers.20.mlp.experts.14.up_proj", "model.layers.20.mlp.experts.15.up_proj", "model.layers.20.mlp.experts.16.up_proj", "model.layers.20.mlp.experts.17.up_proj", "model.layers.20.mlp.experts.18.up_proj", "model.layers.20.mlp.experts.19.up_proj", "model.layers.20.mlp.experts.20.up_proj", "model.layers.20.mlp.experts.21.up_proj", "model.layers.20.mlp.experts.22.up_proj", "model.layers.20.mlp.experts.23.up_proj", "model.layers.20.mlp.experts.24.up_proj", "model.layers.20.mlp.experts.25.up_proj", "model.layers.20.mlp.experts.26.up_proj", "model.layers.20.mlp.experts.27.up_proj", "model.layers.20.mlp.experts.28.up_proj", "model.layers.20.mlp.experts.29.up_proj", "model.layers.20.mlp.experts.30.up_proj", "model.layers.20.mlp.experts.31.up_proj", "model.layers.20.mlp.experts.32.up_proj", "model.layers.20.mlp.experts.33.up_proj", "model.layers.20.mlp.experts.34.up_proj", "model.layers.20.mlp.experts.35.up_proj", "model.layers.20.mlp.experts.36.up_proj", "model.layers.20.mlp.experts.37.up_proj", "model.layers.20.mlp.experts.38.up_proj", "model.layers.20.mlp.experts.39.up_proj", "model.layers.20.mlp.experts.40.up_proj", "model.layers.20.mlp.experts.41.up_proj", "model.layers.20.mlp.experts.42.up_proj", "model.layers.20.mlp.experts.43.up_proj", "model.layers.20.mlp.experts.44.up_proj", "model.layers.20.mlp.experts.45.up_proj", "model.layers.20.mlp.experts.46.up_proj", "model.layers.20.mlp.experts.47.up_proj", "model.layers.20.mlp.experts.48.up_proj", "model.layers.20.mlp.experts.49.up_proj", "model.layers.20.mlp.experts.50.up_proj", "model.layers.20.mlp.experts.51.up_proj", "model.layers.20.mlp.experts.52.up_proj", "model.layers.20.mlp.experts.53.up_proj", "model.layers.20.mlp.experts.54.up_proj", "model.layers.20.mlp.experts.55.up_proj", "model.layers.20.mlp.experts.56.up_proj", "model.layers.20.mlp.experts.57.up_proj", "model.layers.20.mlp.experts.58.up_proj", "model.layers.20.mlp.experts.59.up_proj", "model.layers.20.mlp.experts.60.up_proj", "model.layers.20.mlp.experts.61.up_proj", "model.layers.20.mlp.experts.62.up_proj", "model.layers.20.mlp.experts.63.up_proj", "model.layers.20.mlp.experts.64.up_proj", "model.layers.20.mlp.experts.65.up_proj", "model.layers.20.mlp.experts.66.up_proj", "model.layers.20.mlp.experts.67.up_proj", "model.layers.20.mlp.experts.68.up_proj", "model.layers.20.mlp.experts.69.up_proj", "model.layers.20.mlp.experts.70.up_proj", "model.layers.20.mlp.experts.71.up_proj", "model.layers.20.mlp.experts.72.up_proj", "model.layers.20.mlp.experts.73.up_proj", "model.layers.20.mlp.experts.74.up_proj", "model.layers.20.mlp.experts.75.up_proj", "model.layers.20.mlp.experts.76.up_proj", "model.layers.20.mlp.experts.77.up_proj", "model.layers.20.mlp.experts.78.up_proj", "model.layers.20.mlp.experts.79.up_proj", "model.layers.20.mlp.experts.80.up_proj", "model.layers.20.mlp.experts.81.up_proj", "model.layers.20.mlp.experts.82.up_proj", "model.layers.20.mlp.experts.83.up_proj", "model.layers.20.mlp.experts.84.up_proj", "model.layers.20.mlp.experts.85.up_proj", "model.layers.20.mlp.experts.86.up_proj", "model.layers.20.mlp.experts.87.up_proj", "model.layers.20.mlp.experts.88.up_proj", "model.layers.20.mlp.experts.89.up_proj", "model.layers.20.mlp.experts.90.up_proj", "model.layers.20.mlp.experts.91.up_proj", "model.layers.20.mlp.experts.92.up_proj", "model.layers.20.mlp.experts.93.up_proj", "model.layers.20.mlp.experts.94.up_proj", "model.layers.20.mlp.experts.95.up_proj", "model.layers.20.mlp.experts.96.up_proj", "model.layers.20.mlp.experts.97.up_proj", "model.layers.20.mlp.experts.98.up_proj", "model.layers.20.mlp.experts.99.up_proj", "model.layers.20.mlp.experts.100.up_proj", "model.layers.20.mlp.experts.101.up_proj", "model.layers.20.mlp.experts.102.up_proj", "model.layers.20.mlp.experts.103.up_proj", "model.layers.20.mlp.experts.104.up_proj", "model.layers.20.mlp.experts.105.up_proj", "model.layers.20.mlp.experts.106.up_proj", "model.layers.20.mlp.experts.107.up_proj", "model.layers.20.mlp.experts.108.up_proj", "model.layers.20.mlp.experts.109.up_proj", "model.layers.20.mlp.experts.110.up_proj", "model.layers.20.mlp.experts.111.up_proj", "model.layers.20.mlp.experts.112.up_proj", "model.layers.20.mlp.experts.113.up_proj", "model.layers.20.mlp.experts.114.up_proj", "model.layers.20.mlp.experts.115.up_proj", "model.layers.20.mlp.experts.116.up_proj", "model.layers.20.mlp.experts.117.up_proj", "model.layers.20.mlp.experts.118.up_proj", "model.layers.20.mlp.experts.119.up_proj", "model.layers.20.mlp.experts.120.up_proj", "model.layers.20.mlp.experts.121.up_proj", "model.layers.20.mlp.experts.122.up_proj", "model.layers.20.mlp.experts.123.up_proj", "model.layers.20.mlp.experts.124.up_proj", "model.layers.20.mlp.experts.125.up_proj", "model.layers.20.mlp.experts.126.up_proj", "model.layers.20.mlp.experts.127.up_proj", "model.layers.20.mlp.experts.128.up_proj", "model.layers.20.mlp.experts.129.up_proj", "model.layers.20.mlp.experts.130.up_proj", "model.layers.20.mlp.experts.131.up_proj", "model.layers.20.mlp.experts.132.up_proj", "model.layers.20.mlp.experts.133.up_proj", "model.layers.20.mlp.experts.134.up_proj", "model.layers.20.mlp.experts.135.up_proj", "model.layers.20.mlp.experts.136.up_proj", "model.layers.20.mlp.experts.137.up_proj", "model.layers.20.mlp.experts.138.up_proj", "model.layers.20.mlp.experts.139.up_proj", "model.layers.20.mlp.experts.140.up_proj", "model.layers.20.mlp.experts.141.up_proj", "model.layers.20.mlp.experts.142.up_proj", "model.layers.20.mlp.experts.143.up_proj", "model.layers.20.mlp.experts.144.up_proj", "model.layers.20.mlp.experts.145.up_proj", "model.layers.20.mlp.experts.146.up_proj", "model.layers.20.mlp.experts.147.up_proj", "model.layers.20.mlp.experts.148.up_proj", "model.layers.20.mlp.experts.149.up_proj", "model.layers.20.mlp.experts.150.up_proj", "model.layers.20.mlp.experts.151.up_proj", "model.layers.20.mlp.experts.152.up_proj", "model.layers.20.mlp.experts.153.up_proj", "model.layers.20.mlp.experts.154.up_proj", "model.layers.20.mlp.experts.155.up_proj", "model.layers.20.mlp.experts.156.up_proj", "model.layers.20.mlp.experts.157.up_proj", "model.layers.20.mlp.experts.158.up_proj", "model.layers.20.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -0.00011105185840278725, "dbits": 2516582400 }, { "dkld": -0.0001365325413644307, "dbits": 5033164800 } ] }, { "idx": 122, "layers": [ "model.layers.20.mlp.experts.0.down_proj", "model.layers.20.mlp.experts.1.down_proj", "model.layers.20.mlp.experts.2.down_proj", "model.layers.20.mlp.experts.3.down_proj", "model.layers.20.mlp.experts.4.down_proj", "model.layers.20.mlp.experts.5.down_proj", "model.layers.20.mlp.experts.6.down_proj", "model.layers.20.mlp.experts.7.down_proj", "model.layers.20.mlp.experts.8.down_proj", "model.layers.20.mlp.experts.9.down_proj", "model.layers.20.mlp.experts.10.down_proj", "model.layers.20.mlp.experts.11.down_proj", "model.layers.20.mlp.experts.12.down_proj", "model.layers.20.mlp.experts.13.down_proj", "model.layers.20.mlp.experts.14.down_proj", "model.layers.20.mlp.experts.15.down_proj", "model.layers.20.mlp.experts.16.down_proj", "model.layers.20.mlp.experts.17.down_proj", "model.layers.20.mlp.experts.18.down_proj", "model.layers.20.mlp.experts.19.down_proj", "model.layers.20.mlp.experts.20.down_proj", "model.layers.20.mlp.experts.21.down_proj", "model.layers.20.mlp.experts.22.down_proj", "model.layers.20.mlp.experts.23.down_proj", "model.layers.20.mlp.experts.24.down_proj", "model.layers.20.mlp.experts.25.down_proj", "model.layers.20.mlp.experts.26.down_proj", "model.layers.20.mlp.experts.27.down_proj", "model.layers.20.mlp.experts.28.down_proj", "model.layers.20.mlp.experts.29.down_proj", "model.layers.20.mlp.experts.30.down_proj", "model.layers.20.mlp.experts.31.down_proj", "model.layers.20.mlp.experts.32.down_proj", "model.layers.20.mlp.experts.33.down_proj", "model.layers.20.mlp.experts.34.down_proj", "model.layers.20.mlp.experts.35.down_proj", "model.layers.20.mlp.experts.36.down_proj", "model.layers.20.mlp.experts.37.down_proj", "model.layers.20.mlp.experts.38.down_proj", "model.layers.20.mlp.experts.39.down_proj", "model.layers.20.mlp.experts.40.down_proj", "model.layers.20.mlp.experts.41.down_proj", "model.layers.20.mlp.experts.42.down_proj", "model.layers.20.mlp.experts.43.down_proj", "model.layers.20.mlp.experts.44.down_proj", "model.layers.20.mlp.experts.45.down_proj", "model.layers.20.mlp.experts.46.down_proj", "model.layers.20.mlp.experts.47.down_proj", "model.layers.20.mlp.experts.48.down_proj", "model.layers.20.mlp.experts.49.down_proj", "model.layers.20.mlp.experts.50.down_proj", "model.layers.20.mlp.experts.51.down_proj", "model.layers.20.mlp.experts.52.down_proj", "model.layers.20.mlp.experts.53.down_proj", "model.layers.20.mlp.experts.54.down_proj", "model.layers.20.mlp.experts.55.down_proj", "model.layers.20.mlp.experts.56.down_proj", "model.layers.20.mlp.experts.57.down_proj", "model.layers.20.mlp.experts.58.down_proj", "model.layers.20.mlp.experts.59.down_proj", "model.layers.20.mlp.experts.60.down_proj", "model.layers.20.mlp.experts.61.down_proj", "model.layers.20.mlp.experts.62.down_proj", "model.layers.20.mlp.experts.63.down_proj", "model.layers.20.mlp.experts.64.down_proj", "model.layers.20.mlp.experts.65.down_proj", "model.layers.20.mlp.experts.66.down_proj", "model.layers.20.mlp.experts.67.down_proj", "model.layers.20.mlp.experts.68.down_proj", "model.layers.20.mlp.experts.69.down_proj", "model.layers.20.mlp.experts.70.down_proj", "model.layers.20.mlp.experts.71.down_proj", "model.layers.20.mlp.experts.72.down_proj", "model.layers.20.mlp.experts.73.down_proj", "model.layers.20.mlp.experts.74.down_proj", "model.layers.20.mlp.experts.75.down_proj", "model.layers.20.mlp.experts.76.down_proj", "model.layers.20.mlp.experts.77.down_proj", "model.layers.20.mlp.experts.78.down_proj", "model.layers.20.mlp.experts.79.down_proj", "model.layers.20.mlp.experts.80.down_proj", "model.layers.20.mlp.experts.81.down_proj", "model.layers.20.mlp.experts.82.down_proj", "model.layers.20.mlp.experts.83.down_proj", "model.layers.20.mlp.experts.84.down_proj", "model.layers.20.mlp.experts.85.down_proj", "model.layers.20.mlp.experts.86.down_proj", "model.layers.20.mlp.experts.87.down_proj", "model.layers.20.mlp.experts.88.down_proj", "model.layers.20.mlp.experts.89.down_proj", "model.layers.20.mlp.experts.90.down_proj", "model.layers.20.mlp.experts.91.down_proj", "model.layers.20.mlp.experts.92.down_proj", "model.layers.20.mlp.experts.93.down_proj", "model.layers.20.mlp.experts.94.down_proj", "model.layers.20.mlp.experts.95.down_proj", "model.layers.20.mlp.experts.96.down_proj", "model.layers.20.mlp.experts.97.down_proj", "model.layers.20.mlp.experts.98.down_proj", "model.layers.20.mlp.experts.99.down_proj", "model.layers.20.mlp.experts.100.down_proj", "model.layers.20.mlp.experts.101.down_proj", "model.layers.20.mlp.experts.102.down_proj", "model.layers.20.mlp.experts.103.down_proj", "model.layers.20.mlp.experts.104.down_proj", "model.layers.20.mlp.experts.105.down_proj", "model.layers.20.mlp.experts.106.down_proj", "model.layers.20.mlp.experts.107.down_proj", "model.layers.20.mlp.experts.108.down_proj", "model.layers.20.mlp.experts.109.down_proj", "model.layers.20.mlp.experts.110.down_proj", "model.layers.20.mlp.experts.111.down_proj", "model.layers.20.mlp.experts.112.down_proj", "model.layers.20.mlp.experts.113.down_proj", "model.layers.20.mlp.experts.114.down_proj", "model.layers.20.mlp.experts.115.down_proj", "model.layers.20.mlp.experts.116.down_proj", "model.layers.20.mlp.experts.117.down_proj", "model.layers.20.mlp.experts.118.down_proj", "model.layers.20.mlp.experts.119.down_proj", "model.layers.20.mlp.experts.120.down_proj", "model.layers.20.mlp.experts.121.down_proj", "model.layers.20.mlp.experts.122.down_proj", "model.layers.20.mlp.experts.123.down_proj", "model.layers.20.mlp.experts.124.down_proj", "model.layers.20.mlp.experts.125.down_proj", "model.layers.20.mlp.experts.126.down_proj", "model.layers.20.mlp.experts.127.down_proj", "model.layers.20.mlp.experts.128.down_proj", "model.layers.20.mlp.experts.129.down_proj", "model.layers.20.mlp.experts.130.down_proj", "model.layers.20.mlp.experts.131.down_proj", "model.layers.20.mlp.experts.132.down_proj", "model.layers.20.mlp.experts.133.down_proj", "model.layers.20.mlp.experts.134.down_proj", "model.layers.20.mlp.experts.135.down_proj", "model.layers.20.mlp.experts.136.down_proj", "model.layers.20.mlp.experts.137.down_proj", "model.layers.20.mlp.experts.138.down_proj", "model.layers.20.mlp.experts.139.down_proj", "model.layers.20.mlp.experts.140.down_proj", "model.layers.20.mlp.experts.141.down_proj", "model.layers.20.mlp.experts.142.down_proj", "model.layers.20.mlp.experts.143.down_proj", "model.layers.20.mlp.experts.144.down_proj", "model.layers.20.mlp.experts.145.down_proj", "model.layers.20.mlp.experts.146.down_proj", "model.layers.20.mlp.experts.147.down_proj", "model.layers.20.mlp.experts.148.down_proj", "model.layers.20.mlp.experts.149.down_proj", "model.layers.20.mlp.experts.150.down_proj", "model.layers.20.mlp.experts.151.down_proj", "model.layers.20.mlp.experts.152.down_proj", "model.layers.20.mlp.experts.153.down_proj", "model.layers.20.mlp.experts.154.down_proj", "model.layers.20.mlp.experts.155.down_proj", "model.layers.20.mlp.experts.156.down_proj", "model.layers.20.mlp.experts.157.down_proj", "model.layers.20.mlp.experts.158.down_proj", "model.layers.20.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.5562476366758347e-06, "dbits": 1258291200 }, { "dkld": -2.7582445181905182e-05, "dbits": 2516582400 } ] }, { "idx": 123, "layers": [ "model.layers.21.self_attn.q_proj" ], "candidates": [ { "dkld": -5.6376866996287606e-05, "dbits": 62914560 }, { "dkld": -3.994037397205691e-05, "dbits": 125829120 } ] }, { "idx": 124, "layers": [ "model.layers.21.self_attn.k_proj", "model.layers.21.self_attn.v_proj" ], "candidates": [ { "dkld": 4.250130150467227e-05, "dbits": 10485760 }, { "dkld": -4.140466917306081e-05, "dbits": 20971520 } ] }, { "idx": 125, "layers": [ "model.layers.21.self_attn.o_proj" ], "candidates": [ { "dkld": 0.00011060696560889587, "dbits": 62914560 }, { "dkld": 0.00010915109887719293, "dbits": 125829120 } ] }, { "idx": 126, "layers": [ "model.layers.21.mlp.shared_experts.gate_proj", "model.layers.21.mlp.shared_experts.up_proj", "model.layers.21.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 0.00021913477685302565, "dbits": 23592960 }, { "dkld": 0.00017048190347850392, "dbits": 47185920 } ] }, { "idx": 127, "layers": [ "model.layers.21.mlp.experts.0.gate_proj", "model.layers.21.mlp.experts.1.gate_proj", "model.layers.21.mlp.experts.2.gate_proj", "model.layers.21.mlp.experts.3.gate_proj", "model.layers.21.mlp.experts.4.gate_proj", "model.layers.21.mlp.experts.5.gate_proj", "model.layers.21.mlp.experts.6.gate_proj", "model.layers.21.mlp.experts.7.gate_proj", "model.layers.21.mlp.experts.8.gate_proj", "model.layers.21.mlp.experts.9.gate_proj", "model.layers.21.mlp.experts.10.gate_proj", "model.layers.21.mlp.experts.11.gate_proj", "model.layers.21.mlp.experts.12.gate_proj", "model.layers.21.mlp.experts.13.gate_proj", "model.layers.21.mlp.experts.14.gate_proj", "model.layers.21.mlp.experts.15.gate_proj", "model.layers.21.mlp.experts.16.gate_proj", "model.layers.21.mlp.experts.17.gate_proj", "model.layers.21.mlp.experts.18.gate_proj", "model.layers.21.mlp.experts.19.gate_proj", "model.layers.21.mlp.experts.20.gate_proj", "model.layers.21.mlp.experts.21.gate_proj", "model.layers.21.mlp.experts.22.gate_proj", "model.layers.21.mlp.experts.23.gate_proj", "model.layers.21.mlp.experts.24.gate_proj", "model.layers.21.mlp.experts.25.gate_proj", "model.layers.21.mlp.experts.26.gate_proj", "model.layers.21.mlp.experts.27.gate_proj", "model.layers.21.mlp.experts.28.gate_proj", "model.layers.21.mlp.experts.29.gate_proj", "model.layers.21.mlp.experts.30.gate_proj", "model.layers.21.mlp.experts.31.gate_proj", "model.layers.21.mlp.experts.32.gate_proj", "model.layers.21.mlp.experts.33.gate_proj", "model.layers.21.mlp.experts.34.gate_proj", "model.layers.21.mlp.experts.35.gate_proj", "model.layers.21.mlp.experts.36.gate_proj", "model.layers.21.mlp.experts.37.gate_proj", "model.layers.21.mlp.experts.38.gate_proj", "model.layers.21.mlp.experts.39.gate_proj", "model.layers.21.mlp.experts.40.gate_proj", "model.layers.21.mlp.experts.41.gate_proj", "model.layers.21.mlp.experts.42.gate_proj", "model.layers.21.mlp.experts.43.gate_proj", "model.layers.21.mlp.experts.44.gate_proj", "model.layers.21.mlp.experts.45.gate_proj", "model.layers.21.mlp.experts.46.gate_proj", "model.layers.21.mlp.experts.47.gate_proj", "model.layers.21.mlp.experts.48.gate_proj", "model.layers.21.mlp.experts.49.gate_proj", "model.layers.21.mlp.experts.50.gate_proj", "model.layers.21.mlp.experts.51.gate_proj", "model.layers.21.mlp.experts.52.gate_proj", "model.layers.21.mlp.experts.53.gate_proj", "model.layers.21.mlp.experts.54.gate_proj", "model.layers.21.mlp.experts.55.gate_proj", "model.layers.21.mlp.experts.56.gate_proj", "model.layers.21.mlp.experts.57.gate_proj", "model.layers.21.mlp.experts.58.gate_proj", "model.layers.21.mlp.experts.59.gate_proj", "model.layers.21.mlp.experts.60.gate_proj", "model.layers.21.mlp.experts.61.gate_proj", "model.layers.21.mlp.experts.62.gate_proj", "model.layers.21.mlp.experts.63.gate_proj", "model.layers.21.mlp.experts.64.gate_proj", "model.layers.21.mlp.experts.65.gate_proj", "model.layers.21.mlp.experts.66.gate_proj", "model.layers.21.mlp.experts.67.gate_proj", "model.layers.21.mlp.experts.68.gate_proj", "model.layers.21.mlp.experts.69.gate_proj", "model.layers.21.mlp.experts.70.gate_proj", "model.layers.21.mlp.experts.71.gate_proj", "model.layers.21.mlp.experts.72.gate_proj", "model.layers.21.mlp.experts.73.gate_proj", "model.layers.21.mlp.experts.74.gate_proj", "model.layers.21.mlp.experts.75.gate_proj", "model.layers.21.mlp.experts.76.gate_proj", "model.layers.21.mlp.experts.77.gate_proj", "model.layers.21.mlp.experts.78.gate_proj", "model.layers.21.mlp.experts.79.gate_proj", "model.layers.21.mlp.experts.80.gate_proj", "model.layers.21.mlp.experts.81.gate_proj", "model.layers.21.mlp.experts.82.gate_proj", "model.layers.21.mlp.experts.83.gate_proj", "model.layers.21.mlp.experts.84.gate_proj", "model.layers.21.mlp.experts.85.gate_proj", "model.layers.21.mlp.experts.86.gate_proj", "model.layers.21.mlp.experts.87.gate_proj", "model.layers.21.mlp.experts.88.gate_proj", "model.layers.21.mlp.experts.89.gate_proj", "model.layers.21.mlp.experts.90.gate_proj", "model.layers.21.mlp.experts.91.gate_proj", "model.layers.21.mlp.experts.92.gate_proj", "model.layers.21.mlp.experts.93.gate_proj", "model.layers.21.mlp.experts.94.gate_proj", "model.layers.21.mlp.experts.95.gate_proj", "model.layers.21.mlp.experts.96.gate_proj", "model.layers.21.mlp.experts.97.gate_proj", "model.layers.21.mlp.experts.98.gate_proj", "model.layers.21.mlp.experts.99.gate_proj", "model.layers.21.mlp.experts.100.gate_proj", "model.layers.21.mlp.experts.101.gate_proj", "model.layers.21.mlp.experts.102.gate_proj", "model.layers.21.mlp.experts.103.gate_proj", "model.layers.21.mlp.experts.104.gate_proj", "model.layers.21.mlp.experts.105.gate_proj", "model.layers.21.mlp.experts.106.gate_proj", "model.layers.21.mlp.experts.107.gate_proj", "model.layers.21.mlp.experts.108.gate_proj", "model.layers.21.mlp.experts.109.gate_proj", "model.layers.21.mlp.experts.110.gate_proj", "model.layers.21.mlp.experts.111.gate_proj", "model.layers.21.mlp.experts.112.gate_proj", "model.layers.21.mlp.experts.113.gate_proj", "model.layers.21.mlp.experts.114.gate_proj", "model.layers.21.mlp.experts.115.gate_proj", "model.layers.21.mlp.experts.116.gate_proj", "model.layers.21.mlp.experts.117.gate_proj", "model.layers.21.mlp.experts.118.gate_proj", "model.layers.21.mlp.experts.119.gate_proj", "model.layers.21.mlp.experts.120.gate_proj", "model.layers.21.mlp.experts.121.gate_proj", "model.layers.21.mlp.experts.122.gate_proj", "model.layers.21.mlp.experts.123.gate_proj", "model.layers.21.mlp.experts.124.gate_proj", "model.layers.21.mlp.experts.125.gate_proj", "model.layers.21.mlp.experts.126.gate_proj", "model.layers.21.mlp.experts.127.gate_proj", "model.layers.21.mlp.experts.128.gate_proj", "model.layers.21.mlp.experts.129.gate_proj", "model.layers.21.mlp.experts.130.gate_proj", "model.layers.21.mlp.experts.131.gate_proj", "model.layers.21.mlp.experts.132.gate_proj", "model.layers.21.mlp.experts.133.gate_proj", "model.layers.21.mlp.experts.134.gate_proj", "model.layers.21.mlp.experts.135.gate_proj", "model.layers.21.mlp.experts.136.gate_proj", "model.layers.21.mlp.experts.137.gate_proj", "model.layers.21.mlp.experts.138.gate_proj", "model.layers.21.mlp.experts.139.gate_proj", "model.layers.21.mlp.experts.140.gate_proj", "model.layers.21.mlp.experts.141.gate_proj", "model.layers.21.mlp.experts.142.gate_proj", "model.layers.21.mlp.experts.143.gate_proj", "model.layers.21.mlp.experts.144.gate_proj", "model.layers.21.mlp.experts.145.gate_proj", "model.layers.21.mlp.experts.146.gate_proj", "model.layers.21.mlp.experts.147.gate_proj", "model.layers.21.mlp.experts.148.gate_proj", "model.layers.21.mlp.experts.149.gate_proj", "model.layers.21.mlp.experts.150.gate_proj", "model.layers.21.mlp.experts.151.gate_proj", "model.layers.21.mlp.experts.152.gate_proj", "model.layers.21.mlp.experts.153.gate_proj", "model.layers.21.mlp.experts.154.gate_proj", "model.layers.21.mlp.experts.155.gate_proj", "model.layers.21.mlp.experts.156.gate_proj", "model.layers.21.mlp.experts.157.gate_proj", "model.layers.21.mlp.experts.158.gate_proj", "model.layers.21.mlp.experts.159.gate_proj", "model.layers.21.mlp.experts.0.up_proj", "model.layers.21.mlp.experts.1.up_proj", "model.layers.21.mlp.experts.2.up_proj", "model.layers.21.mlp.experts.3.up_proj", "model.layers.21.mlp.experts.4.up_proj", "model.layers.21.mlp.experts.5.up_proj", "model.layers.21.mlp.experts.6.up_proj", "model.layers.21.mlp.experts.7.up_proj", "model.layers.21.mlp.experts.8.up_proj", "model.layers.21.mlp.experts.9.up_proj", "model.layers.21.mlp.experts.10.up_proj", "model.layers.21.mlp.experts.11.up_proj", "model.layers.21.mlp.experts.12.up_proj", "model.layers.21.mlp.experts.13.up_proj", "model.layers.21.mlp.experts.14.up_proj", "model.layers.21.mlp.experts.15.up_proj", "model.layers.21.mlp.experts.16.up_proj", "model.layers.21.mlp.experts.17.up_proj", "model.layers.21.mlp.experts.18.up_proj", "model.layers.21.mlp.experts.19.up_proj", "model.layers.21.mlp.experts.20.up_proj", "model.layers.21.mlp.experts.21.up_proj", "model.layers.21.mlp.experts.22.up_proj", "model.layers.21.mlp.experts.23.up_proj", "model.layers.21.mlp.experts.24.up_proj", "model.layers.21.mlp.experts.25.up_proj", "model.layers.21.mlp.experts.26.up_proj", "model.layers.21.mlp.experts.27.up_proj", "model.layers.21.mlp.experts.28.up_proj", "model.layers.21.mlp.experts.29.up_proj", "model.layers.21.mlp.experts.30.up_proj", "model.layers.21.mlp.experts.31.up_proj", "model.layers.21.mlp.experts.32.up_proj", "model.layers.21.mlp.experts.33.up_proj", "model.layers.21.mlp.experts.34.up_proj", "model.layers.21.mlp.experts.35.up_proj", "model.layers.21.mlp.experts.36.up_proj", "model.layers.21.mlp.experts.37.up_proj", "model.layers.21.mlp.experts.38.up_proj", "model.layers.21.mlp.experts.39.up_proj", "model.layers.21.mlp.experts.40.up_proj", "model.layers.21.mlp.experts.41.up_proj", "model.layers.21.mlp.experts.42.up_proj", "model.layers.21.mlp.experts.43.up_proj", "model.layers.21.mlp.experts.44.up_proj", "model.layers.21.mlp.experts.45.up_proj", "model.layers.21.mlp.experts.46.up_proj", "model.layers.21.mlp.experts.47.up_proj", "model.layers.21.mlp.experts.48.up_proj", "model.layers.21.mlp.experts.49.up_proj", "model.layers.21.mlp.experts.50.up_proj", "model.layers.21.mlp.experts.51.up_proj", "model.layers.21.mlp.experts.52.up_proj", "model.layers.21.mlp.experts.53.up_proj", "model.layers.21.mlp.experts.54.up_proj", "model.layers.21.mlp.experts.55.up_proj", "model.layers.21.mlp.experts.56.up_proj", "model.layers.21.mlp.experts.57.up_proj", "model.layers.21.mlp.experts.58.up_proj", "model.layers.21.mlp.experts.59.up_proj", "model.layers.21.mlp.experts.60.up_proj", "model.layers.21.mlp.experts.61.up_proj", "model.layers.21.mlp.experts.62.up_proj", "model.layers.21.mlp.experts.63.up_proj", "model.layers.21.mlp.experts.64.up_proj", "model.layers.21.mlp.experts.65.up_proj", "model.layers.21.mlp.experts.66.up_proj", "model.layers.21.mlp.experts.67.up_proj", "model.layers.21.mlp.experts.68.up_proj", "model.layers.21.mlp.experts.69.up_proj", "model.layers.21.mlp.experts.70.up_proj", "model.layers.21.mlp.experts.71.up_proj", "model.layers.21.mlp.experts.72.up_proj", "model.layers.21.mlp.experts.73.up_proj", "model.layers.21.mlp.experts.74.up_proj", "model.layers.21.mlp.experts.75.up_proj", "model.layers.21.mlp.experts.76.up_proj", "model.layers.21.mlp.experts.77.up_proj", "model.layers.21.mlp.experts.78.up_proj", "model.layers.21.mlp.experts.79.up_proj", "model.layers.21.mlp.experts.80.up_proj", "model.layers.21.mlp.experts.81.up_proj", "model.layers.21.mlp.experts.82.up_proj", "model.layers.21.mlp.experts.83.up_proj", "model.layers.21.mlp.experts.84.up_proj", "model.layers.21.mlp.experts.85.up_proj", "model.layers.21.mlp.experts.86.up_proj", "model.layers.21.mlp.experts.87.up_proj", "model.layers.21.mlp.experts.88.up_proj", "model.layers.21.mlp.experts.89.up_proj", "model.layers.21.mlp.experts.90.up_proj", "model.layers.21.mlp.experts.91.up_proj", "model.layers.21.mlp.experts.92.up_proj", "model.layers.21.mlp.experts.93.up_proj", "model.layers.21.mlp.experts.94.up_proj", "model.layers.21.mlp.experts.95.up_proj", "model.layers.21.mlp.experts.96.up_proj", "model.layers.21.mlp.experts.97.up_proj", "model.layers.21.mlp.experts.98.up_proj", "model.layers.21.mlp.experts.99.up_proj", "model.layers.21.mlp.experts.100.up_proj", "model.layers.21.mlp.experts.101.up_proj", "model.layers.21.mlp.experts.102.up_proj", "model.layers.21.mlp.experts.103.up_proj", "model.layers.21.mlp.experts.104.up_proj", "model.layers.21.mlp.experts.105.up_proj", "model.layers.21.mlp.experts.106.up_proj", "model.layers.21.mlp.experts.107.up_proj", "model.layers.21.mlp.experts.108.up_proj", "model.layers.21.mlp.experts.109.up_proj", "model.layers.21.mlp.experts.110.up_proj", "model.layers.21.mlp.experts.111.up_proj", "model.layers.21.mlp.experts.112.up_proj", "model.layers.21.mlp.experts.113.up_proj", "model.layers.21.mlp.experts.114.up_proj", "model.layers.21.mlp.experts.115.up_proj", "model.layers.21.mlp.experts.116.up_proj", "model.layers.21.mlp.experts.117.up_proj", "model.layers.21.mlp.experts.118.up_proj", "model.layers.21.mlp.experts.119.up_proj", "model.layers.21.mlp.experts.120.up_proj", "model.layers.21.mlp.experts.121.up_proj", "model.layers.21.mlp.experts.122.up_proj", "model.layers.21.mlp.experts.123.up_proj", "model.layers.21.mlp.experts.124.up_proj", "model.layers.21.mlp.experts.125.up_proj", "model.layers.21.mlp.experts.126.up_proj", "model.layers.21.mlp.experts.127.up_proj", "model.layers.21.mlp.experts.128.up_proj", "model.layers.21.mlp.experts.129.up_proj", "model.layers.21.mlp.experts.130.up_proj", "model.layers.21.mlp.experts.131.up_proj", "model.layers.21.mlp.experts.132.up_proj", "model.layers.21.mlp.experts.133.up_proj", "model.layers.21.mlp.experts.134.up_proj", "model.layers.21.mlp.experts.135.up_proj", "model.layers.21.mlp.experts.136.up_proj", "model.layers.21.mlp.experts.137.up_proj", "model.layers.21.mlp.experts.138.up_proj", "model.layers.21.mlp.experts.139.up_proj", "model.layers.21.mlp.experts.140.up_proj", "model.layers.21.mlp.experts.141.up_proj", "model.layers.21.mlp.experts.142.up_proj", "model.layers.21.mlp.experts.143.up_proj", "model.layers.21.mlp.experts.144.up_proj", "model.layers.21.mlp.experts.145.up_proj", "model.layers.21.mlp.experts.146.up_proj", "model.layers.21.mlp.experts.147.up_proj", "model.layers.21.mlp.experts.148.up_proj", "model.layers.21.mlp.experts.149.up_proj", "model.layers.21.mlp.experts.150.up_proj", "model.layers.21.mlp.experts.151.up_proj", "model.layers.21.mlp.experts.152.up_proj", "model.layers.21.mlp.experts.153.up_proj", "model.layers.21.mlp.experts.154.up_proj", "model.layers.21.mlp.experts.155.up_proj", "model.layers.21.mlp.experts.156.up_proj", "model.layers.21.mlp.experts.157.up_proj", "model.layers.21.mlp.experts.158.up_proj", "model.layers.21.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.783317800611188e-05, "dbits": 2516582400 }, { "dkld": -9.405273012816871e-05, "dbits": 5033164800 } ] }, { "idx": 128, "layers": [ "model.layers.21.mlp.experts.0.down_proj", "model.layers.21.mlp.experts.1.down_proj", "model.layers.21.mlp.experts.2.down_proj", "model.layers.21.mlp.experts.3.down_proj", "model.layers.21.mlp.experts.4.down_proj", "model.layers.21.mlp.experts.5.down_proj", "model.layers.21.mlp.experts.6.down_proj", "model.layers.21.mlp.experts.7.down_proj", "model.layers.21.mlp.experts.8.down_proj", "model.layers.21.mlp.experts.9.down_proj", "model.layers.21.mlp.experts.10.down_proj", "model.layers.21.mlp.experts.11.down_proj", "model.layers.21.mlp.experts.12.down_proj", "model.layers.21.mlp.experts.13.down_proj", "model.layers.21.mlp.experts.14.down_proj", "model.layers.21.mlp.experts.15.down_proj", "model.layers.21.mlp.experts.16.down_proj", "model.layers.21.mlp.experts.17.down_proj", "model.layers.21.mlp.experts.18.down_proj", "model.layers.21.mlp.experts.19.down_proj", "model.layers.21.mlp.experts.20.down_proj", "model.layers.21.mlp.experts.21.down_proj", "model.layers.21.mlp.experts.22.down_proj", "model.layers.21.mlp.experts.23.down_proj", "model.layers.21.mlp.experts.24.down_proj", "model.layers.21.mlp.experts.25.down_proj", "model.layers.21.mlp.experts.26.down_proj", "model.layers.21.mlp.experts.27.down_proj", "model.layers.21.mlp.experts.28.down_proj", "model.layers.21.mlp.experts.29.down_proj", "model.layers.21.mlp.experts.30.down_proj", "model.layers.21.mlp.experts.31.down_proj", "model.layers.21.mlp.experts.32.down_proj", "model.layers.21.mlp.experts.33.down_proj", "model.layers.21.mlp.experts.34.down_proj", "model.layers.21.mlp.experts.35.down_proj", "model.layers.21.mlp.experts.36.down_proj", "model.layers.21.mlp.experts.37.down_proj", "model.layers.21.mlp.experts.38.down_proj", "model.layers.21.mlp.experts.39.down_proj", "model.layers.21.mlp.experts.40.down_proj", "model.layers.21.mlp.experts.41.down_proj", "model.layers.21.mlp.experts.42.down_proj", "model.layers.21.mlp.experts.43.down_proj", "model.layers.21.mlp.experts.44.down_proj", "model.layers.21.mlp.experts.45.down_proj", "model.layers.21.mlp.experts.46.down_proj", "model.layers.21.mlp.experts.47.down_proj", "model.layers.21.mlp.experts.48.down_proj", "model.layers.21.mlp.experts.49.down_proj", "model.layers.21.mlp.experts.50.down_proj", "model.layers.21.mlp.experts.51.down_proj", "model.layers.21.mlp.experts.52.down_proj", "model.layers.21.mlp.experts.53.down_proj", "model.layers.21.mlp.experts.54.down_proj", "model.layers.21.mlp.experts.55.down_proj", "model.layers.21.mlp.experts.56.down_proj", "model.layers.21.mlp.experts.57.down_proj", "model.layers.21.mlp.experts.58.down_proj", "model.layers.21.mlp.experts.59.down_proj", "model.layers.21.mlp.experts.60.down_proj", "model.layers.21.mlp.experts.61.down_proj", "model.layers.21.mlp.experts.62.down_proj", "model.layers.21.mlp.experts.63.down_proj", "model.layers.21.mlp.experts.64.down_proj", "model.layers.21.mlp.experts.65.down_proj", "model.layers.21.mlp.experts.66.down_proj", "model.layers.21.mlp.experts.67.down_proj", "model.layers.21.mlp.experts.68.down_proj", "model.layers.21.mlp.experts.69.down_proj", "model.layers.21.mlp.experts.70.down_proj", "model.layers.21.mlp.experts.71.down_proj", "model.layers.21.mlp.experts.72.down_proj", "model.layers.21.mlp.experts.73.down_proj", "model.layers.21.mlp.experts.74.down_proj", "model.layers.21.mlp.experts.75.down_proj", "model.layers.21.mlp.experts.76.down_proj", "model.layers.21.mlp.experts.77.down_proj", "model.layers.21.mlp.experts.78.down_proj", "model.layers.21.mlp.experts.79.down_proj", "model.layers.21.mlp.experts.80.down_proj", "model.layers.21.mlp.experts.81.down_proj", "model.layers.21.mlp.experts.82.down_proj", "model.layers.21.mlp.experts.83.down_proj", "model.layers.21.mlp.experts.84.down_proj", "model.layers.21.mlp.experts.85.down_proj", "model.layers.21.mlp.experts.86.down_proj", "model.layers.21.mlp.experts.87.down_proj", "model.layers.21.mlp.experts.88.down_proj", "model.layers.21.mlp.experts.89.down_proj", "model.layers.21.mlp.experts.90.down_proj", "model.layers.21.mlp.experts.91.down_proj", "model.layers.21.mlp.experts.92.down_proj", "model.layers.21.mlp.experts.93.down_proj", "model.layers.21.mlp.experts.94.down_proj", "model.layers.21.mlp.experts.95.down_proj", "model.layers.21.mlp.experts.96.down_proj", "model.layers.21.mlp.experts.97.down_proj", "model.layers.21.mlp.experts.98.down_proj", "model.layers.21.mlp.experts.99.down_proj", "model.layers.21.mlp.experts.100.down_proj", "model.layers.21.mlp.experts.101.down_proj", "model.layers.21.mlp.experts.102.down_proj", "model.layers.21.mlp.experts.103.down_proj", "model.layers.21.mlp.experts.104.down_proj", "model.layers.21.mlp.experts.105.down_proj", "model.layers.21.mlp.experts.106.down_proj", "model.layers.21.mlp.experts.107.down_proj", "model.layers.21.mlp.experts.108.down_proj", "model.layers.21.mlp.experts.109.down_proj", "model.layers.21.mlp.experts.110.down_proj", "model.layers.21.mlp.experts.111.down_proj", "model.layers.21.mlp.experts.112.down_proj", "model.layers.21.mlp.experts.113.down_proj", "model.layers.21.mlp.experts.114.down_proj", "model.layers.21.mlp.experts.115.down_proj", "model.layers.21.mlp.experts.116.down_proj", "model.layers.21.mlp.experts.117.down_proj", "model.layers.21.mlp.experts.118.down_proj", "model.layers.21.mlp.experts.119.down_proj", "model.layers.21.mlp.experts.120.down_proj", "model.layers.21.mlp.experts.121.down_proj", "model.layers.21.mlp.experts.122.down_proj", "model.layers.21.mlp.experts.123.down_proj", "model.layers.21.mlp.experts.124.down_proj", "model.layers.21.mlp.experts.125.down_proj", "model.layers.21.mlp.experts.126.down_proj", "model.layers.21.mlp.experts.127.down_proj", "model.layers.21.mlp.experts.128.down_proj", "model.layers.21.mlp.experts.129.down_proj", "model.layers.21.mlp.experts.130.down_proj", "model.layers.21.mlp.experts.131.down_proj", "model.layers.21.mlp.experts.132.down_proj", "model.layers.21.mlp.experts.133.down_proj", "model.layers.21.mlp.experts.134.down_proj", "model.layers.21.mlp.experts.135.down_proj", "model.layers.21.mlp.experts.136.down_proj", "model.layers.21.mlp.experts.137.down_proj", "model.layers.21.mlp.experts.138.down_proj", "model.layers.21.mlp.experts.139.down_proj", "model.layers.21.mlp.experts.140.down_proj", "model.layers.21.mlp.experts.141.down_proj", "model.layers.21.mlp.experts.142.down_proj", "model.layers.21.mlp.experts.143.down_proj", "model.layers.21.mlp.experts.144.down_proj", "model.layers.21.mlp.experts.145.down_proj", "model.layers.21.mlp.experts.146.down_proj", "model.layers.21.mlp.experts.147.down_proj", "model.layers.21.mlp.experts.148.down_proj", "model.layers.21.mlp.experts.149.down_proj", "model.layers.21.mlp.experts.150.down_proj", "model.layers.21.mlp.experts.151.down_proj", "model.layers.21.mlp.experts.152.down_proj", "model.layers.21.mlp.experts.153.down_proj", "model.layers.21.mlp.experts.154.down_proj", "model.layers.21.mlp.experts.155.down_proj", "model.layers.21.mlp.experts.156.down_proj", "model.layers.21.mlp.experts.157.down_proj", "model.layers.21.mlp.experts.158.down_proj", "model.layers.21.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -0.0001368091674521562, "dbits": 1258291200 }, { "dkld": -0.00010539989452808957, "dbits": 2516582400 } ] }, { "idx": 129, "layers": [ "model.layers.22.self_attn.q_proj" ], "candidates": [ { "dkld": -3.003717865794793e-05, "dbits": 62914560 }, { "dkld": 5.248747766018608e-06, "dbits": 125829120 } ] }, { "idx": 130, "layers": [ "model.layers.22.self_attn.k_proj", "model.layers.22.self_attn.v_proj" ], "candidates": [ { "dkld": -7.712540682405095e-05, "dbits": 10485760 }, { "dkld": 2.764021046459779e-05, "dbits": 20971520 } ] }, { "idx": 131, "layers": [ "model.layers.22.self_attn.o_proj" ], "candidates": [ { "dkld": 3.84040642529733e-05, "dbits": 62914560 }, { "dkld": 0.00010579689405858586, "dbits": 125829120 } ] }, { "idx": 132, "layers": [ "model.layers.22.mlp.shared_experts.gate_proj", "model.layers.22.mlp.shared_experts.up_proj", "model.layers.22.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 2.7987826615573017e-05, "dbits": 23592960 }, { "dkld": 1.5621795319021095e-05, "dbits": 47185920 } ] }, { "idx": 133, "layers": [ "model.layers.22.mlp.experts.0.gate_proj", "model.layers.22.mlp.experts.1.gate_proj", "model.layers.22.mlp.experts.2.gate_proj", "model.layers.22.mlp.experts.3.gate_proj", "model.layers.22.mlp.experts.4.gate_proj", "model.layers.22.mlp.experts.5.gate_proj", "model.layers.22.mlp.experts.6.gate_proj", "model.layers.22.mlp.experts.7.gate_proj", "model.layers.22.mlp.experts.8.gate_proj", "model.layers.22.mlp.experts.9.gate_proj", "model.layers.22.mlp.experts.10.gate_proj", "model.layers.22.mlp.experts.11.gate_proj", "model.layers.22.mlp.experts.12.gate_proj", "model.layers.22.mlp.experts.13.gate_proj", "model.layers.22.mlp.experts.14.gate_proj", "model.layers.22.mlp.experts.15.gate_proj", "model.layers.22.mlp.experts.16.gate_proj", "model.layers.22.mlp.experts.17.gate_proj", "model.layers.22.mlp.experts.18.gate_proj", "model.layers.22.mlp.experts.19.gate_proj", "model.layers.22.mlp.experts.20.gate_proj", "model.layers.22.mlp.experts.21.gate_proj", "model.layers.22.mlp.experts.22.gate_proj", "model.layers.22.mlp.experts.23.gate_proj", "model.layers.22.mlp.experts.24.gate_proj", "model.layers.22.mlp.experts.25.gate_proj", "model.layers.22.mlp.experts.26.gate_proj", "model.layers.22.mlp.experts.27.gate_proj", "model.layers.22.mlp.experts.28.gate_proj", "model.layers.22.mlp.experts.29.gate_proj", "model.layers.22.mlp.experts.30.gate_proj", "model.layers.22.mlp.experts.31.gate_proj", "model.layers.22.mlp.experts.32.gate_proj", "model.layers.22.mlp.experts.33.gate_proj", "model.layers.22.mlp.experts.34.gate_proj", "model.layers.22.mlp.experts.35.gate_proj", "model.layers.22.mlp.experts.36.gate_proj", "model.layers.22.mlp.experts.37.gate_proj", "model.layers.22.mlp.experts.38.gate_proj", "model.layers.22.mlp.experts.39.gate_proj", "model.layers.22.mlp.experts.40.gate_proj", "model.layers.22.mlp.experts.41.gate_proj", "model.layers.22.mlp.experts.42.gate_proj", "model.layers.22.mlp.experts.43.gate_proj", "model.layers.22.mlp.experts.44.gate_proj", "model.layers.22.mlp.experts.45.gate_proj", "model.layers.22.mlp.experts.46.gate_proj", "model.layers.22.mlp.experts.47.gate_proj", "model.layers.22.mlp.experts.48.gate_proj", "model.layers.22.mlp.experts.49.gate_proj", "model.layers.22.mlp.experts.50.gate_proj", "model.layers.22.mlp.experts.51.gate_proj", "model.layers.22.mlp.experts.52.gate_proj", "model.layers.22.mlp.experts.53.gate_proj", "model.layers.22.mlp.experts.54.gate_proj", "model.layers.22.mlp.experts.55.gate_proj", "model.layers.22.mlp.experts.56.gate_proj", "model.layers.22.mlp.experts.57.gate_proj", "model.layers.22.mlp.experts.58.gate_proj", "model.layers.22.mlp.experts.59.gate_proj", "model.layers.22.mlp.experts.60.gate_proj", "model.layers.22.mlp.experts.61.gate_proj", "model.layers.22.mlp.experts.62.gate_proj", "model.layers.22.mlp.experts.63.gate_proj", "model.layers.22.mlp.experts.64.gate_proj", "model.layers.22.mlp.experts.65.gate_proj", "model.layers.22.mlp.experts.66.gate_proj", "model.layers.22.mlp.experts.67.gate_proj", "model.layers.22.mlp.experts.68.gate_proj", "model.layers.22.mlp.experts.69.gate_proj", "model.layers.22.mlp.experts.70.gate_proj", "model.layers.22.mlp.experts.71.gate_proj", "model.layers.22.mlp.experts.72.gate_proj", "model.layers.22.mlp.experts.73.gate_proj", "model.layers.22.mlp.experts.74.gate_proj", "model.layers.22.mlp.experts.75.gate_proj", "model.layers.22.mlp.experts.76.gate_proj", "model.layers.22.mlp.experts.77.gate_proj", "model.layers.22.mlp.experts.78.gate_proj", "model.layers.22.mlp.experts.79.gate_proj", "model.layers.22.mlp.experts.80.gate_proj", "model.layers.22.mlp.experts.81.gate_proj", "model.layers.22.mlp.experts.82.gate_proj", "model.layers.22.mlp.experts.83.gate_proj", "model.layers.22.mlp.experts.84.gate_proj", "model.layers.22.mlp.experts.85.gate_proj", "model.layers.22.mlp.experts.86.gate_proj", "model.layers.22.mlp.experts.87.gate_proj", "model.layers.22.mlp.experts.88.gate_proj", "model.layers.22.mlp.experts.89.gate_proj", "model.layers.22.mlp.experts.90.gate_proj", "model.layers.22.mlp.experts.91.gate_proj", "model.layers.22.mlp.experts.92.gate_proj", "model.layers.22.mlp.experts.93.gate_proj", "model.layers.22.mlp.experts.94.gate_proj", "model.layers.22.mlp.experts.95.gate_proj", "model.layers.22.mlp.experts.96.gate_proj", "model.layers.22.mlp.experts.97.gate_proj", "model.layers.22.mlp.experts.98.gate_proj", "model.layers.22.mlp.experts.99.gate_proj", "model.layers.22.mlp.experts.100.gate_proj", "model.layers.22.mlp.experts.101.gate_proj", "model.layers.22.mlp.experts.102.gate_proj", "model.layers.22.mlp.experts.103.gate_proj", "model.layers.22.mlp.experts.104.gate_proj", "model.layers.22.mlp.experts.105.gate_proj", "model.layers.22.mlp.experts.106.gate_proj", "model.layers.22.mlp.experts.107.gate_proj", "model.layers.22.mlp.experts.108.gate_proj", "model.layers.22.mlp.experts.109.gate_proj", "model.layers.22.mlp.experts.110.gate_proj", "model.layers.22.mlp.experts.111.gate_proj", "model.layers.22.mlp.experts.112.gate_proj", "model.layers.22.mlp.experts.113.gate_proj", "model.layers.22.mlp.experts.114.gate_proj", "model.layers.22.mlp.experts.115.gate_proj", "model.layers.22.mlp.experts.116.gate_proj", "model.layers.22.mlp.experts.117.gate_proj", "model.layers.22.mlp.experts.118.gate_proj", "model.layers.22.mlp.experts.119.gate_proj", "model.layers.22.mlp.experts.120.gate_proj", "model.layers.22.mlp.experts.121.gate_proj", "model.layers.22.mlp.experts.122.gate_proj", "model.layers.22.mlp.experts.123.gate_proj", "model.layers.22.mlp.experts.124.gate_proj", "model.layers.22.mlp.experts.125.gate_proj", "model.layers.22.mlp.experts.126.gate_proj", "model.layers.22.mlp.experts.127.gate_proj", "model.layers.22.mlp.experts.128.gate_proj", "model.layers.22.mlp.experts.129.gate_proj", "model.layers.22.mlp.experts.130.gate_proj", "model.layers.22.mlp.experts.131.gate_proj", "model.layers.22.mlp.experts.132.gate_proj", "model.layers.22.mlp.experts.133.gate_proj", "model.layers.22.mlp.experts.134.gate_proj", "model.layers.22.mlp.experts.135.gate_proj", "model.layers.22.mlp.experts.136.gate_proj", "model.layers.22.mlp.experts.137.gate_proj", "model.layers.22.mlp.experts.138.gate_proj", "model.layers.22.mlp.experts.139.gate_proj", "model.layers.22.mlp.experts.140.gate_proj", "model.layers.22.mlp.experts.141.gate_proj", "model.layers.22.mlp.experts.142.gate_proj", "model.layers.22.mlp.experts.143.gate_proj", "model.layers.22.mlp.experts.144.gate_proj", "model.layers.22.mlp.experts.145.gate_proj", "model.layers.22.mlp.experts.146.gate_proj", "model.layers.22.mlp.experts.147.gate_proj", "model.layers.22.mlp.experts.148.gate_proj", "model.layers.22.mlp.experts.149.gate_proj", "model.layers.22.mlp.experts.150.gate_proj", "model.layers.22.mlp.experts.151.gate_proj", "model.layers.22.mlp.experts.152.gate_proj", "model.layers.22.mlp.experts.153.gate_proj", "model.layers.22.mlp.experts.154.gate_proj", "model.layers.22.mlp.experts.155.gate_proj", "model.layers.22.mlp.experts.156.gate_proj", "model.layers.22.mlp.experts.157.gate_proj", "model.layers.22.mlp.experts.158.gate_proj", "model.layers.22.mlp.experts.159.gate_proj", "model.layers.22.mlp.experts.0.up_proj", "model.layers.22.mlp.experts.1.up_proj", "model.layers.22.mlp.experts.2.up_proj", "model.layers.22.mlp.experts.3.up_proj", "model.layers.22.mlp.experts.4.up_proj", "model.layers.22.mlp.experts.5.up_proj", "model.layers.22.mlp.experts.6.up_proj", "model.layers.22.mlp.experts.7.up_proj", "model.layers.22.mlp.experts.8.up_proj", "model.layers.22.mlp.experts.9.up_proj", "model.layers.22.mlp.experts.10.up_proj", "model.layers.22.mlp.experts.11.up_proj", "model.layers.22.mlp.experts.12.up_proj", "model.layers.22.mlp.experts.13.up_proj", "model.layers.22.mlp.experts.14.up_proj", "model.layers.22.mlp.experts.15.up_proj", "model.layers.22.mlp.experts.16.up_proj", "model.layers.22.mlp.experts.17.up_proj", "model.layers.22.mlp.experts.18.up_proj", "model.layers.22.mlp.experts.19.up_proj", "model.layers.22.mlp.experts.20.up_proj", "model.layers.22.mlp.experts.21.up_proj", "model.layers.22.mlp.experts.22.up_proj", "model.layers.22.mlp.experts.23.up_proj", "model.layers.22.mlp.experts.24.up_proj", "model.layers.22.mlp.experts.25.up_proj", "model.layers.22.mlp.experts.26.up_proj", "model.layers.22.mlp.experts.27.up_proj", "model.layers.22.mlp.experts.28.up_proj", "model.layers.22.mlp.experts.29.up_proj", "model.layers.22.mlp.experts.30.up_proj", "model.layers.22.mlp.experts.31.up_proj", "model.layers.22.mlp.experts.32.up_proj", "model.layers.22.mlp.experts.33.up_proj", "model.layers.22.mlp.experts.34.up_proj", "model.layers.22.mlp.experts.35.up_proj", "model.layers.22.mlp.experts.36.up_proj", "model.layers.22.mlp.experts.37.up_proj", "model.layers.22.mlp.experts.38.up_proj", "model.layers.22.mlp.experts.39.up_proj", "model.layers.22.mlp.experts.40.up_proj", "model.layers.22.mlp.experts.41.up_proj", "model.layers.22.mlp.experts.42.up_proj", "model.layers.22.mlp.experts.43.up_proj", "model.layers.22.mlp.experts.44.up_proj", "model.layers.22.mlp.experts.45.up_proj", "model.layers.22.mlp.experts.46.up_proj", "model.layers.22.mlp.experts.47.up_proj", "model.layers.22.mlp.experts.48.up_proj", "model.layers.22.mlp.experts.49.up_proj", "model.layers.22.mlp.experts.50.up_proj", "model.layers.22.mlp.experts.51.up_proj", "model.layers.22.mlp.experts.52.up_proj", "model.layers.22.mlp.experts.53.up_proj", "model.layers.22.mlp.experts.54.up_proj", "model.layers.22.mlp.experts.55.up_proj", "model.layers.22.mlp.experts.56.up_proj", "model.layers.22.mlp.experts.57.up_proj", "model.layers.22.mlp.experts.58.up_proj", "model.layers.22.mlp.experts.59.up_proj", "model.layers.22.mlp.experts.60.up_proj", "model.layers.22.mlp.experts.61.up_proj", "model.layers.22.mlp.experts.62.up_proj", "model.layers.22.mlp.experts.63.up_proj", "model.layers.22.mlp.experts.64.up_proj", "model.layers.22.mlp.experts.65.up_proj", "model.layers.22.mlp.experts.66.up_proj", "model.layers.22.mlp.experts.67.up_proj", "model.layers.22.mlp.experts.68.up_proj", "model.layers.22.mlp.experts.69.up_proj", "model.layers.22.mlp.experts.70.up_proj", "model.layers.22.mlp.experts.71.up_proj", "model.layers.22.mlp.experts.72.up_proj", "model.layers.22.mlp.experts.73.up_proj", "model.layers.22.mlp.experts.74.up_proj", "model.layers.22.mlp.experts.75.up_proj", "model.layers.22.mlp.experts.76.up_proj", "model.layers.22.mlp.experts.77.up_proj", "model.layers.22.mlp.experts.78.up_proj", "model.layers.22.mlp.experts.79.up_proj", "model.layers.22.mlp.experts.80.up_proj", "model.layers.22.mlp.experts.81.up_proj", "model.layers.22.mlp.experts.82.up_proj", "model.layers.22.mlp.experts.83.up_proj", "model.layers.22.mlp.experts.84.up_proj", "model.layers.22.mlp.experts.85.up_proj", "model.layers.22.mlp.experts.86.up_proj", "model.layers.22.mlp.experts.87.up_proj", "model.layers.22.mlp.experts.88.up_proj", "model.layers.22.mlp.experts.89.up_proj", "model.layers.22.mlp.experts.90.up_proj", "model.layers.22.mlp.experts.91.up_proj", "model.layers.22.mlp.experts.92.up_proj", "model.layers.22.mlp.experts.93.up_proj", "model.layers.22.mlp.experts.94.up_proj", "model.layers.22.mlp.experts.95.up_proj", "model.layers.22.mlp.experts.96.up_proj", "model.layers.22.mlp.experts.97.up_proj", "model.layers.22.mlp.experts.98.up_proj", "model.layers.22.mlp.experts.99.up_proj", "model.layers.22.mlp.experts.100.up_proj", "model.layers.22.mlp.experts.101.up_proj", "model.layers.22.mlp.experts.102.up_proj", "model.layers.22.mlp.experts.103.up_proj", "model.layers.22.mlp.experts.104.up_proj", "model.layers.22.mlp.experts.105.up_proj", "model.layers.22.mlp.experts.106.up_proj", "model.layers.22.mlp.experts.107.up_proj", "model.layers.22.mlp.experts.108.up_proj", "model.layers.22.mlp.experts.109.up_proj", "model.layers.22.mlp.experts.110.up_proj", "model.layers.22.mlp.experts.111.up_proj", "model.layers.22.mlp.experts.112.up_proj", "model.layers.22.mlp.experts.113.up_proj", "model.layers.22.mlp.experts.114.up_proj", "model.layers.22.mlp.experts.115.up_proj", "model.layers.22.mlp.experts.116.up_proj", "model.layers.22.mlp.experts.117.up_proj", "model.layers.22.mlp.experts.118.up_proj", "model.layers.22.mlp.experts.119.up_proj", "model.layers.22.mlp.experts.120.up_proj", "model.layers.22.mlp.experts.121.up_proj", "model.layers.22.mlp.experts.122.up_proj", "model.layers.22.mlp.experts.123.up_proj", "model.layers.22.mlp.experts.124.up_proj", "model.layers.22.mlp.experts.125.up_proj", "model.layers.22.mlp.experts.126.up_proj", "model.layers.22.mlp.experts.127.up_proj", "model.layers.22.mlp.experts.128.up_proj", "model.layers.22.mlp.experts.129.up_proj", "model.layers.22.mlp.experts.130.up_proj", "model.layers.22.mlp.experts.131.up_proj", "model.layers.22.mlp.experts.132.up_proj", "model.layers.22.mlp.experts.133.up_proj", "model.layers.22.mlp.experts.134.up_proj", "model.layers.22.mlp.experts.135.up_proj", "model.layers.22.mlp.experts.136.up_proj", "model.layers.22.mlp.experts.137.up_proj", "model.layers.22.mlp.experts.138.up_proj", "model.layers.22.mlp.experts.139.up_proj", "model.layers.22.mlp.experts.140.up_proj", "model.layers.22.mlp.experts.141.up_proj", "model.layers.22.mlp.experts.142.up_proj", "model.layers.22.mlp.experts.143.up_proj", "model.layers.22.mlp.experts.144.up_proj", "model.layers.22.mlp.experts.145.up_proj", "model.layers.22.mlp.experts.146.up_proj", "model.layers.22.mlp.experts.147.up_proj", "model.layers.22.mlp.experts.148.up_proj", "model.layers.22.mlp.experts.149.up_proj", "model.layers.22.mlp.experts.150.up_proj", "model.layers.22.mlp.experts.151.up_proj", "model.layers.22.mlp.experts.152.up_proj", "model.layers.22.mlp.experts.153.up_proj", "model.layers.22.mlp.experts.154.up_proj", "model.layers.22.mlp.experts.155.up_proj", "model.layers.22.mlp.experts.156.up_proj", "model.layers.22.mlp.experts.157.up_proj", "model.layers.22.mlp.experts.158.up_proj", "model.layers.22.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -6.688504945486645e-05, "dbits": 2516582400 }, { "dkld": -0.00012273264583200112, "dbits": 5033164800 } ] }, { "idx": 134, "layers": [ "model.layers.22.mlp.experts.0.down_proj", "model.layers.22.mlp.experts.1.down_proj", "model.layers.22.mlp.experts.2.down_proj", "model.layers.22.mlp.experts.3.down_proj", "model.layers.22.mlp.experts.4.down_proj", "model.layers.22.mlp.experts.5.down_proj", "model.layers.22.mlp.experts.6.down_proj", "model.layers.22.mlp.experts.7.down_proj", "model.layers.22.mlp.experts.8.down_proj", "model.layers.22.mlp.experts.9.down_proj", "model.layers.22.mlp.experts.10.down_proj", "model.layers.22.mlp.experts.11.down_proj", "model.layers.22.mlp.experts.12.down_proj", "model.layers.22.mlp.experts.13.down_proj", "model.layers.22.mlp.experts.14.down_proj", "model.layers.22.mlp.experts.15.down_proj", "model.layers.22.mlp.experts.16.down_proj", "model.layers.22.mlp.experts.17.down_proj", "model.layers.22.mlp.experts.18.down_proj", "model.layers.22.mlp.experts.19.down_proj", "model.layers.22.mlp.experts.20.down_proj", "model.layers.22.mlp.experts.21.down_proj", "model.layers.22.mlp.experts.22.down_proj", "model.layers.22.mlp.experts.23.down_proj", "model.layers.22.mlp.experts.24.down_proj", "model.layers.22.mlp.experts.25.down_proj", "model.layers.22.mlp.experts.26.down_proj", "model.layers.22.mlp.experts.27.down_proj", "model.layers.22.mlp.experts.28.down_proj", "model.layers.22.mlp.experts.29.down_proj", "model.layers.22.mlp.experts.30.down_proj", "model.layers.22.mlp.experts.31.down_proj", "model.layers.22.mlp.experts.32.down_proj", "model.layers.22.mlp.experts.33.down_proj", "model.layers.22.mlp.experts.34.down_proj", "model.layers.22.mlp.experts.35.down_proj", "model.layers.22.mlp.experts.36.down_proj", "model.layers.22.mlp.experts.37.down_proj", "model.layers.22.mlp.experts.38.down_proj", "model.layers.22.mlp.experts.39.down_proj", "model.layers.22.mlp.experts.40.down_proj", "model.layers.22.mlp.experts.41.down_proj", "model.layers.22.mlp.experts.42.down_proj", "model.layers.22.mlp.experts.43.down_proj", "model.layers.22.mlp.experts.44.down_proj", "model.layers.22.mlp.experts.45.down_proj", "model.layers.22.mlp.experts.46.down_proj", "model.layers.22.mlp.experts.47.down_proj", "model.layers.22.mlp.experts.48.down_proj", "model.layers.22.mlp.experts.49.down_proj", "model.layers.22.mlp.experts.50.down_proj", "model.layers.22.mlp.experts.51.down_proj", "model.layers.22.mlp.experts.52.down_proj", "model.layers.22.mlp.experts.53.down_proj", "model.layers.22.mlp.experts.54.down_proj", "model.layers.22.mlp.experts.55.down_proj", "model.layers.22.mlp.experts.56.down_proj", "model.layers.22.mlp.experts.57.down_proj", "model.layers.22.mlp.experts.58.down_proj", "model.layers.22.mlp.experts.59.down_proj", "model.layers.22.mlp.experts.60.down_proj", "model.layers.22.mlp.experts.61.down_proj", "model.layers.22.mlp.experts.62.down_proj", "model.layers.22.mlp.experts.63.down_proj", "model.layers.22.mlp.experts.64.down_proj", "model.layers.22.mlp.experts.65.down_proj", "model.layers.22.mlp.experts.66.down_proj", "model.layers.22.mlp.experts.67.down_proj", "model.layers.22.mlp.experts.68.down_proj", "model.layers.22.mlp.experts.69.down_proj", "model.layers.22.mlp.experts.70.down_proj", "model.layers.22.mlp.experts.71.down_proj", "model.layers.22.mlp.experts.72.down_proj", "model.layers.22.mlp.experts.73.down_proj", "model.layers.22.mlp.experts.74.down_proj", "model.layers.22.mlp.experts.75.down_proj", "model.layers.22.mlp.experts.76.down_proj", "model.layers.22.mlp.experts.77.down_proj", "model.layers.22.mlp.experts.78.down_proj", "model.layers.22.mlp.experts.79.down_proj", "model.layers.22.mlp.experts.80.down_proj", "model.layers.22.mlp.experts.81.down_proj", "model.layers.22.mlp.experts.82.down_proj", "model.layers.22.mlp.experts.83.down_proj", "model.layers.22.mlp.experts.84.down_proj", "model.layers.22.mlp.experts.85.down_proj", "model.layers.22.mlp.experts.86.down_proj", "model.layers.22.mlp.experts.87.down_proj", "model.layers.22.mlp.experts.88.down_proj", "model.layers.22.mlp.experts.89.down_proj", "model.layers.22.mlp.experts.90.down_proj", "model.layers.22.mlp.experts.91.down_proj", "model.layers.22.mlp.experts.92.down_proj", "model.layers.22.mlp.experts.93.down_proj", "model.layers.22.mlp.experts.94.down_proj", "model.layers.22.mlp.experts.95.down_proj", "model.layers.22.mlp.experts.96.down_proj", "model.layers.22.mlp.experts.97.down_proj", "model.layers.22.mlp.experts.98.down_proj", "model.layers.22.mlp.experts.99.down_proj", "model.layers.22.mlp.experts.100.down_proj", "model.layers.22.mlp.experts.101.down_proj", "model.layers.22.mlp.experts.102.down_proj", "model.layers.22.mlp.experts.103.down_proj", "model.layers.22.mlp.experts.104.down_proj", "model.layers.22.mlp.experts.105.down_proj", "model.layers.22.mlp.experts.106.down_proj", "model.layers.22.mlp.experts.107.down_proj", "model.layers.22.mlp.experts.108.down_proj", "model.layers.22.mlp.experts.109.down_proj", "model.layers.22.mlp.experts.110.down_proj", "model.layers.22.mlp.experts.111.down_proj", "model.layers.22.mlp.experts.112.down_proj", "model.layers.22.mlp.experts.113.down_proj", "model.layers.22.mlp.experts.114.down_proj", "model.layers.22.mlp.experts.115.down_proj", "model.layers.22.mlp.experts.116.down_proj", "model.layers.22.mlp.experts.117.down_proj", "model.layers.22.mlp.experts.118.down_proj", "model.layers.22.mlp.experts.119.down_proj", "model.layers.22.mlp.experts.120.down_proj", "model.layers.22.mlp.experts.121.down_proj", "model.layers.22.mlp.experts.122.down_proj", "model.layers.22.mlp.experts.123.down_proj", "model.layers.22.mlp.experts.124.down_proj", "model.layers.22.mlp.experts.125.down_proj", "model.layers.22.mlp.experts.126.down_proj", "model.layers.22.mlp.experts.127.down_proj", "model.layers.22.mlp.experts.128.down_proj", "model.layers.22.mlp.experts.129.down_proj", "model.layers.22.mlp.experts.130.down_proj", "model.layers.22.mlp.experts.131.down_proj", "model.layers.22.mlp.experts.132.down_proj", "model.layers.22.mlp.experts.133.down_proj", "model.layers.22.mlp.experts.134.down_proj", "model.layers.22.mlp.experts.135.down_proj", "model.layers.22.mlp.experts.136.down_proj", "model.layers.22.mlp.experts.137.down_proj", "model.layers.22.mlp.experts.138.down_proj", "model.layers.22.mlp.experts.139.down_proj", "model.layers.22.mlp.experts.140.down_proj", "model.layers.22.mlp.experts.141.down_proj", "model.layers.22.mlp.experts.142.down_proj", "model.layers.22.mlp.experts.143.down_proj", "model.layers.22.mlp.experts.144.down_proj", "model.layers.22.mlp.experts.145.down_proj", "model.layers.22.mlp.experts.146.down_proj", "model.layers.22.mlp.experts.147.down_proj", "model.layers.22.mlp.experts.148.down_proj", "model.layers.22.mlp.experts.149.down_proj", "model.layers.22.mlp.experts.150.down_proj", "model.layers.22.mlp.experts.151.down_proj", "model.layers.22.mlp.experts.152.down_proj", "model.layers.22.mlp.experts.153.down_proj", "model.layers.22.mlp.experts.154.down_proj", "model.layers.22.mlp.experts.155.down_proj", "model.layers.22.mlp.experts.156.down_proj", "model.layers.22.mlp.experts.157.down_proj", "model.layers.22.mlp.experts.158.down_proj", "model.layers.22.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -8.041767869144609e-05, "dbits": 1258291200 }, { "dkld": -6.706963758915628e-05, "dbits": 2516582400 } ] }, { "idx": 135, "layers": [ "model.layers.23.self_attn.q_proj" ], "candidates": [ { "dkld": -4.4688046909867676e-05, "dbits": 62914560 }, { "dkld": -1.4548655599355698e-05, "dbits": 125829120 } ] }, { "idx": 136, "layers": [ "model.layers.23.self_attn.k_proj", "model.layers.23.self_attn.v_proj" ], "candidates": [ { "dkld": -9.862447623163427e-05, "dbits": 10485760 }, { "dkld": -3.7379749119281075e-05, "dbits": 20971520 } ] }, { "idx": 137, "layers": [ "model.layers.23.self_attn.o_proj" ], "candidates": [ { "dkld": 7.719078566879173e-05, "dbits": 62914560 }, { "dkld": 7.599720265716314e-05, "dbits": 125829120 } ] }, { "idx": 138, "layers": [ "model.layers.23.mlp.shared_experts.gate_proj", "model.layers.23.mlp.shared_experts.up_proj", "model.layers.23.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -9.214796591550112e-05, "dbits": 23592960 }, { "dkld": -5.196698475629091e-05, "dbits": 47185920 } ] }, { "idx": 139, "layers": [ "model.layers.23.mlp.experts.0.gate_proj", "model.layers.23.mlp.experts.1.gate_proj", "model.layers.23.mlp.experts.2.gate_proj", "model.layers.23.mlp.experts.3.gate_proj", "model.layers.23.mlp.experts.4.gate_proj", "model.layers.23.mlp.experts.5.gate_proj", "model.layers.23.mlp.experts.6.gate_proj", "model.layers.23.mlp.experts.7.gate_proj", "model.layers.23.mlp.experts.8.gate_proj", "model.layers.23.mlp.experts.9.gate_proj", "model.layers.23.mlp.experts.10.gate_proj", "model.layers.23.mlp.experts.11.gate_proj", "model.layers.23.mlp.experts.12.gate_proj", "model.layers.23.mlp.experts.13.gate_proj", "model.layers.23.mlp.experts.14.gate_proj", "model.layers.23.mlp.experts.15.gate_proj", "model.layers.23.mlp.experts.16.gate_proj", "model.layers.23.mlp.experts.17.gate_proj", "model.layers.23.mlp.experts.18.gate_proj", "model.layers.23.mlp.experts.19.gate_proj", "model.layers.23.mlp.experts.20.gate_proj", "model.layers.23.mlp.experts.21.gate_proj", "model.layers.23.mlp.experts.22.gate_proj", "model.layers.23.mlp.experts.23.gate_proj", "model.layers.23.mlp.experts.24.gate_proj", "model.layers.23.mlp.experts.25.gate_proj", "model.layers.23.mlp.experts.26.gate_proj", "model.layers.23.mlp.experts.27.gate_proj", "model.layers.23.mlp.experts.28.gate_proj", "model.layers.23.mlp.experts.29.gate_proj", "model.layers.23.mlp.experts.30.gate_proj", "model.layers.23.mlp.experts.31.gate_proj", "model.layers.23.mlp.experts.32.gate_proj", "model.layers.23.mlp.experts.33.gate_proj", "model.layers.23.mlp.experts.34.gate_proj", "model.layers.23.mlp.experts.35.gate_proj", "model.layers.23.mlp.experts.36.gate_proj", "model.layers.23.mlp.experts.37.gate_proj", "model.layers.23.mlp.experts.38.gate_proj", "model.layers.23.mlp.experts.39.gate_proj", "model.layers.23.mlp.experts.40.gate_proj", "model.layers.23.mlp.experts.41.gate_proj", "model.layers.23.mlp.experts.42.gate_proj", "model.layers.23.mlp.experts.43.gate_proj", "model.layers.23.mlp.experts.44.gate_proj", "model.layers.23.mlp.experts.45.gate_proj", "model.layers.23.mlp.experts.46.gate_proj", "model.layers.23.mlp.experts.47.gate_proj", "model.layers.23.mlp.experts.48.gate_proj", "model.layers.23.mlp.experts.49.gate_proj", "model.layers.23.mlp.experts.50.gate_proj", "model.layers.23.mlp.experts.51.gate_proj", "model.layers.23.mlp.experts.52.gate_proj", "model.layers.23.mlp.experts.53.gate_proj", "model.layers.23.mlp.experts.54.gate_proj", "model.layers.23.mlp.experts.55.gate_proj", "model.layers.23.mlp.experts.56.gate_proj", "model.layers.23.mlp.experts.57.gate_proj", "model.layers.23.mlp.experts.58.gate_proj", "model.layers.23.mlp.experts.59.gate_proj", "model.layers.23.mlp.experts.60.gate_proj", "model.layers.23.mlp.experts.61.gate_proj", "model.layers.23.mlp.experts.62.gate_proj", "model.layers.23.mlp.experts.63.gate_proj", "model.layers.23.mlp.experts.64.gate_proj", "model.layers.23.mlp.experts.65.gate_proj", "model.layers.23.mlp.experts.66.gate_proj", "model.layers.23.mlp.experts.67.gate_proj", "model.layers.23.mlp.experts.68.gate_proj", "model.layers.23.mlp.experts.69.gate_proj", "model.layers.23.mlp.experts.70.gate_proj", "model.layers.23.mlp.experts.71.gate_proj", "model.layers.23.mlp.experts.72.gate_proj", "model.layers.23.mlp.experts.73.gate_proj", "model.layers.23.mlp.experts.74.gate_proj", "model.layers.23.mlp.experts.75.gate_proj", "model.layers.23.mlp.experts.76.gate_proj", "model.layers.23.mlp.experts.77.gate_proj", "model.layers.23.mlp.experts.78.gate_proj", "model.layers.23.mlp.experts.79.gate_proj", "model.layers.23.mlp.experts.80.gate_proj", "model.layers.23.mlp.experts.81.gate_proj", "model.layers.23.mlp.experts.82.gate_proj", "model.layers.23.mlp.experts.83.gate_proj", "model.layers.23.mlp.experts.84.gate_proj", "model.layers.23.mlp.experts.85.gate_proj", "model.layers.23.mlp.experts.86.gate_proj", "model.layers.23.mlp.experts.87.gate_proj", "model.layers.23.mlp.experts.88.gate_proj", "model.layers.23.mlp.experts.89.gate_proj", "model.layers.23.mlp.experts.90.gate_proj", "model.layers.23.mlp.experts.91.gate_proj", "model.layers.23.mlp.experts.92.gate_proj", "model.layers.23.mlp.experts.93.gate_proj", "model.layers.23.mlp.experts.94.gate_proj", "model.layers.23.mlp.experts.95.gate_proj", "model.layers.23.mlp.experts.96.gate_proj", "model.layers.23.mlp.experts.97.gate_proj", "model.layers.23.mlp.experts.98.gate_proj", "model.layers.23.mlp.experts.99.gate_proj", "model.layers.23.mlp.experts.100.gate_proj", "model.layers.23.mlp.experts.101.gate_proj", "model.layers.23.mlp.experts.102.gate_proj", "model.layers.23.mlp.experts.103.gate_proj", "model.layers.23.mlp.experts.104.gate_proj", "model.layers.23.mlp.experts.105.gate_proj", "model.layers.23.mlp.experts.106.gate_proj", "model.layers.23.mlp.experts.107.gate_proj", "model.layers.23.mlp.experts.108.gate_proj", "model.layers.23.mlp.experts.109.gate_proj", "model.layers.23.mlp.experts.110.gate_proj", "model.layers.23.mlp.experts.111.gate_proj", "model.layers.23.mlp.experts.112.gate_proj", "model.layers.23.mlp.experts.113.gate_proj", "model.layers.23.mlp.experts.114.gate_proj", "model.layers.23.mlp.experts.115.gate_proj", "model.layers.23.mlp.experts.116.gate_proj", "model.layers.23.mlp.experts.117.gate_proj", "model.layers.23.mlp.experts.118.gate_proj", "model.layers.23.mlp.experts.119.gate_proj", "model.layers.23.mlp.experts.120.gate_proj", "model.layers.23.mlp.experts.121.gate_proj", "model.layers.23.mlp.experts.122.gate_proj", "model.layers.23.mlp.experts.123.gate_proj", "model.layers.23.mlp.experts.124.gate_proj", "model.layers.23.mlp.experts.125.gate_proj", "model.layers.23.mlp.experts.126.gate_proj", "model.layers.23.mlp.experts.127.gate_proj", "model.layers.23.mlp.experts.128.gate_proj", "model.layers.23.mlp.experts.129.gate_proj", "model.layers.23.mlp.experts.130.gate_proj", "model.layers.23.mlp.experts.131.gate_proj", "model.layers.23.mlp.experts.132.gate_proj", "model.layers.23.mlp.experts.133.gate_proj", "model.layers.23.mlp.experts.134.gate_proj", "model.layers.23.mlp.experts.135.gate_proj", "model.layers.23.mlp.experts.136.gate_proj", "model.layers.23.mlp.experts.137.gate_proj", "model.layers.23.mlp.experts.138.gate_proj", "model.layers.23.mlp.experts.139.gate_proj", "model.layers.23.mlp.experts.140.gate_proj", "model.layers.23.mlp.experts.141.gate_proj", "model.layers.23.mlp.experts.142.gate_proj", "model.layers.23.mlp.experts.143.gate_proj", "model.layers.23.mlp.experts.144.gate_proj", "model.layers.23.mlp.experts.145.gate_proj", "model.layers.23.mlp.experts.146.gate_proj", "model.layers.23.mlp.experts.147.gate_proj", "model.layers.23.mlp.experts.148.gate_proj", "model.layers.23.mlp.experts.149.gate_proj", "model.layers.23.mlp.experts.150.gate_proj", "model.layers.23.mlp.experts.151.gate_proj", "model.layers.23.mlp.experts.152.gate_proj", "model.layers.23.mlp.experts.153.gate_proj", "model.layers.23.mlp.experts.154.gate_proj", "model.layers.23.mlp.experts.155.gate_proj", "model.layers.23.mlp.experts.156.gate_proj", "model.layers.23.mlp.experts.157.gate_proj", "model.layers.23.mlp.experts.158.gate_proj", "model.layers.23.mlp.experts.159.gate_proj", "model.layers.23.mlp.experts.0.up_proj", "model.layers.23.mlp.experts.1.up_proj", "model.layers.23.mlp.experts.2.up_proj", "model.layers.23.mlp.experts.3.up_proj", "model.layers.23.mlp.experts.4.up_proj", "model.layers.23.mlp.experts.5.up_proj", "model.layers.23.mlp.experts.6.up_proj", "model.layers.23.mlp.experts.7.up_proj", "model.layers.23.mlp.experts.8.up_proj", "model.layers.23.mlp.experts.9.up_proj", "model.layers.23.mlp.experts.10.up_proj", "model.layers.23.mlp.experts.11.up_proj", "model.layers.23.mlp.experts.12.up_proj", "model.layers.23.mlp.experts.13.up_proj", "model.layers.23.mlp.experts.14.up_proj", "model.layers.23.mlp.experts.15.up_proj", "model.layers.23.mlp.experts.16.up_proj", "model.layers.23.mlp.experts.17.up_proj", "model.layers.23.mlp.experts.18.up_proj", "model.layers.23.mlp.experts.19.up_proj", "model.layers.23.mlp.experts.20.up_proj", "model.layers.23.mlp.experts.21.up_proj", "model.layers.23.mlp.experts.22.up_proj", "model.layers.23.mlp.experts.23.up_proj", "model.layers.23.mlp.experts.24.up_proj", "model.layers.23.mlp.experts.25.up_proj", "model.layers.23.mlp.experts.26.up_proj", "model.layers.23.mlp.experts.27.up_proj", "model.layers.23.mlp.experts.28.up_proj", "model.layers.23.mlp.experts.29.up_proj", "model.layers.23.mlp.experts.30.up_proj", "model.layers.23.mlp.experts.31.up_proj", "model.layers.23.mlp.experts.32.up_proj", "model.layers.23.mlp.experts.33.up_proj", "model.layers.23.mlp.experts.34.up_proj", "model.layers.23.mlp.experts.35.up_proj", "model.layers.23.mlp.experts.36.up_proj", "model.layers.23.mlp.experts.37.up_proj", "model.layers.23.mlp.experts.38.up_proj", "model.layers.23.mlp.experts.39.up_proj", "model.layers.23.mlp.experts.40.up_proj", "model.layers.23.mlp.experts.41.up_proj", "model.layers.23.mlp.experts.42.up_proj", "model.layers.23.mlp.experts.43.up_proj", "model.layers.23.mlp.experts.44.up_proj", "model.layers.23.mlp.experts.45.up_proj", "model.layers.23.mlp.experts.46.up_proj", "model.layers.23.mlp.experts.47.up_proj", "model.layers.23.mlp.experts.48.up_proj", "model.layers.23.mlp.experts.49.up_proj", "model.layers.23.mlp.experts.50.up_proj", "model.layers.23.mlp.experts.51.up_proj", "model.layers.23.mlp.experts.52.up_proj", "model.layers.23.mlp.experts.53.up_proj", "model.layers.23.mlp.experts.54.up_proj", "model.layers.23.mlp.experts.55.up_proj", "model.layers.23.mlp.experts.56.up_proj", "model.layers.23.mlp.experts.57.up_proj", "model.layers.23.mlp.experts.58.up_proj", "model.layers.23.mlp.experts.59.up_proj", "model.layers.23.mlp.experts.60.up_proj", "model.layers.23.mlp.experts.61.up_proj", "model.layers.23.mlp.experts.62.up_proj", "model.layers.23.mlp.experts.63.up_proj", "model.layers.23.mlp.experts.64.up_proj", "model.layers.23.mlp.experts.65.up_proj", "model.layers.23.mlp.experts.66.up_proj", "model.layers.23.mlp.experts.67.up_proj", "model.layers.23.mlp.experts.68.up_proj", "model.layers.23.mlp.experts.69.up_proj", "model.layers.23.mlp.experts.70.up_proj", "model.layers.23.mlp.experts.71.up_proj", "model.layers.23.mlp.experts.72.up_proj", "model.layers.23.mlp.experts.73.up_proj", "model.layers.23.mlp.experts.74.up_proj", "model.layers.23.mlp.experts.75.up_proj", "model.layers.23.mlp.experts.76.up_proj", "model.layers.23.mlp.experts.77.up_proj", "model.layers.23.mlp.experts.78.up_proj", "model.layers.23.mlp.experts.79.up_proj", "model.layers.23.mlp.experts.80.up_proj", "model.layers.23.mlp.experts.81.up_proj", "model.layers.23.mlp.experts.82.up_proj", "model.layers.23.mlp.experts.83.up_proj", "model.layers.23.mlp.experts.84.up_proj", "model.layers.23.mlp.experts.85.up_proj", "model.layers.23.mlp.experts.86.up_proj", "model.layers.23.mlp.experts.87.up_proj", "model.layers.23.mlp.experts.88.up_proj", "model.layers.23.mlp.experts.89.up_proj", "model.layers.23.mlp.experts.90.up_proj", "model.layers.23.mlp.experts.91.up_proj", "model.layers.23.mlp.experts.92.up_proj", "model.layers.23.mlp.experts.93.up_proj", "model.layers.23.mlp.experts.94.up_proj", "model.layers.23.mlp.experts.95.up_proj", "model.layers.23.mlp.experts.96.up_proj", "model.layers.23.mlp.experts.97.up_proj", "model.layers.23.mlp.experts.98.up_proj", "model.layers.23.mlp.experts.99.up_proj", "model.layers.23.mlp.experts.100.up_proj", "model.layers.23.mlp.experts.101.up_proj", "model.layers.23.mlp.experts.102.up_proj", "model.layers.23.mlp.experts.103.up_proj", "model.layers.23.mlp.experts.104.up_proj", "model.layers.23.mlp.experts.105.up_proj", "model.layers.23.mlp.experts.106.up_proj", "model.layers.23.mlp.experts.107.up_proj", "model.layers.23.mlp.experts.108.up_proj", "model.layers.23.mlp.experts.109.up_proj", "model.layers.23.mlp.experts.110.up_proj", "model.layers.23.mlp.experts.111.up_proj", "model.layers.23.mlp.experts.112.up_proj", "model.layers.23.mlp.experts.113.up_proj", "model.layers.23.mlp.experts.114.up_proj", "model.layers.23.mlp.experts.115.up_proj", "model.layers.23.mlp.experts.116.up_proj", "model.layers.23.mlp.experts.117.up_proj", "model.layers.23.mlp.experts.118.up_proj", "model.layers.23.mlp.experts.119.up_proj", "model.layers.23.mlp.experts.120.up_proj", "model.layers.23.mlp.experts.121.up_proj", "model.layers.23.mlp.experts.122.up_proj", "model.layers.23.mlp.experts.123.up_proj", "model.layers.23.mlp.experts.124.up_proj", "model.layers.23.mlp.experts.125.up_proj", "model.layers.23.mlp.experts.126.up_proj", "model.layers.23.mlp.experts.127.up_proj", "model.layers.23.mlp.experts.128.up_proj", "model.layers.23.mlp.experts.129.up_proj", "model.layers.23.mlp.experts.130.up_proj", "model.layers.23.mlp.experts.131.up_proj", "model.layers.23.mlp.experts.132.up_proj", "model.layers.23.mlp.experts.133.up_proj", "model.layers.23.mlp.experts.134.up_proj", "model.layers.23.mlp.experts.135.up_proj", "model.layers.23.mlp.experts.136.up_proj", "model.layers.23.mlp.experts.137.up_proj", "model.layers.23.mlp.experts.138.up_proj", "model.layers.23.mlp.experts.139.up_proj", "model.layers.23.mlp.experts.140.up_proj", "model.layers.23.mlp.experts.141.up_proj", "model.layers.23.mlp.experts.142.up_proj", "model.layers.23.mlp.experts.143.up_proj", "model.layers.23.mlp.experts.144.up_proj", "model.layers.23.mlp.experts.145.up_proj", "model.layers.23.mlp.experts.146.up_proj", "model.layers.23.mlp.experts.147.up_proj", "model.layers.23.mlp.experts.148.up_proj", "model.layers.23.mlp.experts.149.up_proj", "model.layers.23.mlp.experts.150.up_proj", "model.layers.23.mlp.experts.151.up_proj", "model.layers.23.mlp.experts.152.up_proj", "model.layers.23.mlp.experts.153.up_proj", "model.layers.23.mlp.experts.154.up_proj", "model.layers.23.mlp.experts.155.up_proj", "model.layers.23.mlp.experts.156.up_proj", "model.layers.23.mlp.experts.157.up_proj", "model.layers.23.mlp.experts.158.up_proj", "model.layers.23.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -0.00012306463904678683, "dbits": 2516582400 }, { "dkld": -0.00011755505111068348, "dbits": 5033164800 } ] }, { "idx": 140, "layers": [ "model.layers.23.mlp.experts.0.down_proj", "model.layers.23.mlp.experts.1.down_proj", "model.layers.23.mlp.experts.2.down_proj", "model.layers.23.mlp.experts.3.down_proj", "model.layers.23.mlp.experts.4.down_proj", "model.layers.23.mlp.experts.5.down_proj", "model.layers.23.mlp.experts.6.down_proj", "model.layers.23.mlp.experts.7.down_proj", "model.layers.23.mlp.experts.8.down_proj", "model.layers.23.mlp.experts.9.down_proj", "model.layers.23.mlp.experts.10.down_proj", "model.layers.23.mlp.experts.11.down_proj", "model.layers.23.mlp.experts.12.down_proj", "model.layers.23.mlp.experts.13.down_proj", "model.layers.23.mlp.experts.14.down_proj", "model.layers.23.mlp.experts.15.down_proj", "model.layers.23.mlp.experts.16.down_proj", "model.layers.23.mlp.experts.17.down_proj", "model.layers.23.mlp.experts.18.down_proj", "model.layers.23.mlp.experts.19.down_proj", "model.layers.23.mlp.experts.20.down_proj", "model.layers.23.mlp.experts.21.down_proj", "model.layers.23.mlp.experts.22.down_proj", "model.layers.23.mlp.experts.23.down_proj", "model.layers.23.mlp.experts.24.down_proj", "model.layers.23.mlp.experts.25.down_proj", "model.layers.23.mlp.experts.26.down_proj", "model.layers.23.mlp.experts.27.down_proj", "model.layers.23.mlp.experts.28.down_proj", "model.layers.23.mlp.experts.29.down_proj", "model.layers.23.mlp.experts.30.down_proj", "model.layers.23.mlp.experts.31.down_proj", "model.layers.23.mlp.experts.32.down_proj", "model.layers.23.mlp.experts.33.down_proj", "model.layers.23.mlp.experts.34.down_proj", "model.layers.23.mlp.experts.35.down_proj", "model.layers.23.mlp.experts.36.down_proj", "model.layers.23.mlp.experts.37.down_proj", "model.layers.23.mlp.experts.38.down_proj", "model.layers.23.mlp.experts.39.down_proj", "model.layers.23.mlp.experts.40.down_proj", "model.layers.23.mlp.experts.41.down_proj", "model.layers.23.mlp.experts.42.down_proj", "model.layers.23.mlp.experts.43.down_proj", "model.layers.23.mlp.experts.44.down_proj", "model.layers.23.mlp.experts.45.down_proj", "model.layers.23.mlp.experts.46.down_proj", "model.layers.23.mlp.experts.47.down_proj", "model.layers.23.mlp.experts.48.down_proj", "model.layers.23.mlp.experts.49.down_proj", "model.layers.23.mlp.experts.50.down_proj", "model.layers.23.mlp.experts.51.down_proj", "model.layers.23.mlp.experts.52.down_proj", "model.layers.23.mlp.experts.53.down_proj", "model.layers.23.mlp.experts.54.down_proj", "model.layers.23.mlp.experts.55.down_proj", "model.layers.23.mlp.experts.56.down_proj", "model.layers.23.mlp.experts.57.down_proj", "model.layers.23.mlp.experts.58.down_proj", "model.layers.23.mlp.experts.59.down_proj", "model.layers.23.mlp.experts.60.down_proj", "model.layers.23.mlp.experts.61.down_proj", "model.layers.23.mlp.experts.62.down_proj", "model.layers.23.mlp.experts.63.down_proj", "model.layers.23.mlp.experts.64.down_proj", "model.layers.23.mlp.experts.65.down_proj", "model.layers.23.mlp.experts.66.down_proj", "model.layers.23.mlp.experts.67.down_proj", "model.layers.23.mlp.experts.68.down_proj", "model.layers.23.mlp.experts.69.down_proj", "model.layers.23.mlp.experts.70.down_proj", "model.layers.23.mlp.experts.71.down_proj", "model.layers.23.mlp.experts.72.down_proj", "model.layers.23.mlp.experts.73.down_proj", "model.layers.23.mlp.experts.74.down_proj", "model.layers.23.mlp.experts.75.down_proj", "model.layers.23.mlp.experts.76.down_proj", "model.layers.23.mlp.experts.77.down_proj", "model.layers.23.mlp.experts.78.down_proj", "model.layers.23.mlp.experts.79.down_proj", "model.layers.23.mlp.experts.80.down_proj", "model.layers.23.mlp.experts.81.down_proj", "model.layers.23.mlp.experts.82.down_proj", "model.layers.23.mlp.experts.83.down_proj", "model.layers.23.mlp.experts.84.down_proj", "model.layers.23.mlp.experts.85.down_proj", "model.layers.23.mlp.experts.86.down_proj", "model.layers.23.mlp.experts.87.down_proj", "model.layers.23.mlp.experts.88.down_proj", "model.layers.23.mlp.experts.89.down_proj", "model.layers.23.mlp.experts.90.down_proj", "model.layers.23.mlp.experts.91.down_proj", "model.layers.23.mlp.experts.92.down_proj", "model.layers.23.mlp.experts.93.down_proj", "model.layers.23.mlp.experts.94.down_proj", "model.layers.23.mlp.experts.95.down_proj", "model.layers.23.mlp.experts.96.down_proj", "model.layers.23.mlp.experts.97.down_proj", "model.layers.23.mlp.experts.98.down_proj", "model.layers.23.mlp.experts.99.down_proj", "model.layers.23.mlp.experts.100.down_proj", "model.layers.23.mlp.experts.101.down_proj", "model.layers.23.mlp.experts.102.down_proj", "model.layers.23.mlp.experts.103.down_proj", "model.layers.23.mlp.experts.104.down_proj", "model.layers.23.mlp.experts.105.down_proj", "model.layers.23.mlp.experts.106.down_proj", "model.layers.23.mlp.experts.107.down_proj", "model.layers.23.mlp.experts.108.down_proj", "model.layers.23.mlp.experts.109.down_proj", "model.layers.23.mlp.experts.110.down_proj", "model.layers.23.mlp.experts.111.down_proj", "model.layers.23.mlp.experts.112.down_proj", "model.layers.23.mlp.experts.113.down_proj", "model.layers.23.mlp.experts.114.down_proj", "model.layers.23.mlp.experts.115.down_proj", "model.layers.23.mlp.experts.116.down_proj", "model.layers.23.mlp.experts.117.down_proj", "model.layers.23.mlp.experts.118.down_proj", "model.layers.23.mlp.experts.119.down_proj", "model.layers.23.mlp.experts.120.down_proj", "model.layers.23.mlp.experts.121.down_proj", "model.layers.23.mlp.experts.122.down_proj", "model.layers.23.mlp.experts.123.down_proj", "model.layers.23.mlp.experts.124.down_proj", "model.layers.23.mlp.experts.125.down_proj", "model.layers.23.mlp.experts.126.down_proj", "model.layers.23.mlp.experts.127.down_proj", "model.layers.23.mlp.experts.128.down_proj", "model.layers.23.mlp.experts.129.down_proj", "model.layers.23.mlp.experts.130.down_proj", "model.layers.23.mlp.experts.131.down_proj", "model.layers.23.mlp.experts.132.down_proj", "model.layers.23.mlp.experts.133.down_proj", "model.layers.23.mlp.experts.134.down_proj", "model.layers.23.mlp.experts.135.down_proj", "model.layers.23.mlp.experts.136.down_proj", "model.layers.23.mlp.experts.137.down_proj", "model.layers.23.mlp.experts.138.down_proj", "model.layers.23.mlp.experts.139.down_proj", "model.layers.23.mlp.experts.140.down_proj", "model.layers.23.mlp.experts.141.down_proj", "model.layers.23.mlp.experts.142.down_proj", "model.layers.23.mlp.experts.143.down_proj", "model.layers.23.mlp.experts.144.down_proj", "model.layers.23.mlp.experts.145.down_proj", "model.layers.23.mlp.experts.146.down_proj", "model.layers.23.mlp.experts.147.down_proj", "model.layers.23.mlp.experts.148.down_proj", "model.layers.23.mlp.experts.149.down_proj", "model.layers.23.mlp.experts.150.down_proj", "model.layers.23.mlp.experts.151.down_proj", "model.layers.23.mlp.experts.152.down_proj", "model.layers.23.mlp.experts.153.down_proj", "model.layers.23.mlp.experts.154.down_proj", "model.layers.23.mlp.experts.155.down_proj", "model.layers.23.mlp.experts.156.down_proj", "model.layers.23.mlp.experts.157.down_proj", "model.layers.23.mlp.experts.158.down_proj", "model.layers.23.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.3908273801206155e-05, "dbits": 1258291200 }, { "dkld": -3.0583376064895196e-05, "dbits": 2516582400 } ] }, { "idx": 141, "layers": [ "model.layers.24.self_attn.q_proj" ], "candidates": [ { "dkld": -0.00010320062283426454, "dbits": 62914560 }, { "dkld": -9.743242990225415e-05, "dbits": 125829120 } ] }, { "idx": 142, "layers": [ "model.layers.24.self_attn.k_proj", "model.layers.24.self_attn.v_proj" ], "candidates": [ { "dkld": -6.30661845207204e-05, "dbits": 10485760 }, { "dkld": -0.00012964829802513018, "dbits": 20971520 } ] }, { "idx": 143, "layers": [ "model.layers.24.self_attn.o_proj" ], "candidates": [ { "dkld": -1.9858614541588826e-05, "dbits": 62914560 }, { "dkld": -0.00015443996526300768, "dbits": 125829120 } ] }, { "idx": 144, "layers": [ "model.layers.24.mlp.shared_experts.gate_proj", "model.layers.24.mlp.shared_experts.up_proj", "model.layers.24.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 4.131263121962686e-05, "dbits": 23592960 }, { "dkld": -0.00012651202268898487, "dbits": 47185920 } ] }, { "idx": 145, "layers": [ "model.layers.24.mlp.experts.0.gate_proj", "model.layers.24.mlp.experts.1.gate_proj", "model.layers.24.mlp.experts.2.gate_proj", "model.layers.24.mlp.experts.3.gate_proj", "model.layers.24.mlp.experts.4.gate_proj", "model.layers.24.mlp.experts.5.gate_proj", "model.layers.24.mlp.experts.6.gate_proj", "model.layers.24.mlp.experts.7.gate_proj", "model.layers.24.mlp.experts.8.gate_proj", "model.layers.24.mlp.experts.9.gate_proj", "model.layers.24.mlp.experts.10.gate_proj", "model.layers.24.mlp.experts.11.gate_proj", "model.layers.24.mlp.experts.12.gate_proj", "model.layers.24.mlp.experts.13.gate_proj", "model.layers.24.mlp.experts.14.gate_proj", "model.layers.24.mlp.experts.15.gate_proj", "model.layers.24.mlp.experts.16.gate_proj", "model.layers.24.mlp.experts.17.gate_proj", "model.layers.24.mlp.experts.18.gate_proj", "model.layers.24.mlp.experts.19.gate_proj", "model.layers.24.mlp.experts.20.gate_proj", "model.layers.24.mlp.experts.21.gate_proj", "model.layers.24.mlp.experts.22.gate_proj", "model.layers.24.mlp.experts.23.gate_proj", "model.layers.24.mlp.experts.24.gate_proj", "model.layers.24.mlp.experts.25.gate_proj", "model.layers.24.mlp.experts.26.gate_proj", "model.layers.24.mlp.experts.27.gate_proj", "model.layers.24.mlp.experts.28.gate_proj", "model.layers.24.mlp.experts.29.gate_proj", "model.layers.24.mlp.experts.30.gate_proj", "model.layers.24.mlp.experts.31.gate_proj", "model.layers.24.mlp.experts.32.gate_proj", "model.layers.24.mlp.experts.33.gate_proj", "model.layers.24.mlp.experts.34.gate_proj", "model.layers.24.mlp.experts.35.gate_proj", "model.layers.24.mlp.experts.36.gate_proj", "model.layers.24.mlp.experts.37.gate_proj", "model.layers.24.mlp.experts.38.gate_proj", "model.layers.24.mlp.experts.39.gate_proj", "model.layers.24.mlp.experts.40.gate_proj", "model.layers.24.mlp.experts.41.gate_proj", "model.layers.24.mlp.experts.42.gate_proj", "model.layers.24.mlp.experts.43.gate_proj", "model.layers.24.mlp.experts.44.gate_proj", "model.layers.24.mlp.experts.45.gate_proj", "model.layers.24.mlp.experts.46.gate_proj", "model.layers.24.mlp.experts.47.gate_proj", "model.layers.24.mlp.experts.48.gate_proj", "model.layers.24.mlp.experts.49.gate_proj", "model.layers.24.mlp.experts.50.gate_proj", "model.layers.24.mlp.experts.51.gate_proj", "model.layers.24.mlp.experts.52.gate_proj", "model.layers.24.mlp.experts.53.gate_proj", "model.layers.24.mlp.experts.54.gate_proj", "model.layers.24.mlp.experts.55.gate_proj", "model.layers.24.mlp.experts.56.gate_proj", "model.layers.24.mlp.experts.57.gate_proj", "model.layers.24.mlp.experts.58.gate_proj", "model.layers.24.mlp.experts.59.gate_proj", "model.layers.24.mlp.experts.60.gate_proj", "model.layers.24.mlp.experts.61.gate_proj", "model.layers.24.mlp.experts.62.gate_proj", "model.layers.24.mlp.experts.63.gate_proj", "model.layers.24.mlp.experts.64.gate_proj", "model.layers.24.mlp.experts.65.gate_proj", "model.layers.24.mlp.experts.66.gate_proj", "model.layers.24.mlp.experts.67.gate_proj", "model.layers.24.mlp.experts.68.gate_proj", "model.layers.24.mlp.experts.69.gate_proj", "model.layers.24.mlp.experts.70.gate_proj", "model.layers.24.mlp.experts.71.gate_proj", "model.layers.24.mlp.experts.72.gate_proj", "model.layers.24.mlp.experts.73.gate_proj", "model.layers.24.mlp.experts.74.gate_proj", "model.layers.24.mlp.experts.75.gate_proj", "model.layers.24.mlp.experts.76.gate_proj", "model.layers.24.mlp.experts.77.gate_proj", "model.layers.24.mlp.experts.78.gate_proj", "model.layers.24.mlp.experts.79.gate_proj", "model.layers.24.mlp.experts.80.gate_proj", "model.layers.24.mlp.experts.81.gate_proj", "model.layers.24.mlp.experts.82.gate_proj", "model.layers.24.mlp.experts.83.gate_proj", "model.layers.24.mlp.experts.84.gate_proj", "model.layers.24.mlp.experts.85.gate_proj", "model.layers.24.mlp.experts.86.gate_proj", "model.layers.24.mlp.experts.87.gate_proj", "model.layers.24.mlp.experts.88.gate_proj", "model.layers.24.mlp.experts.89.gate_proj", "model.layers.24.mlp.experts.90.gate_proj", "model.layers.24.mlp.experts.91.gate_proj", "model.layers.24.mlp.experts.92.gate_proj", "model.layers.24.mlp.experts.93.gate_proj", "model.layers.24.mlp.experts.94.gate_proj", "model.layers.24.mlp.experts.95.gate_proj", "model.layers.24.mlp.experts.96.gate_proj", "model.layers.24.mlp.experts.97.gate_proj", "model.layers.24.mlp.experts.98.gate_proj", "model.layers.24.mlp.experts.99.gate_proj", "model.layers.24.mlp.experts.100.gate_proj", "model.layers.24.mlp.experts.101.gate_proj", "model.layers.24.mlp.experts.102.gate_proj", "model.layers.24.mlp.experts.103.gate_proj", "model.layers.24.mlp.experts.104.gate_proj", "model.layers.24.mlp.experts.105.gate_proj", "model.layers.24.mlp.experts.106.gate_proj", "model.layers.24.mlp.experts.107.gate_proj", "model.layers.24.mlp.experts.108.gate_proj", "model.layers.24.mlp.experts.109.gate_proj", "model.layers.24.mlp.experts.110.gate_proj", "model.layers.24.mlp.experts.111.gate_proj", "model.layers.24.mlp.experts.112.gate_proj", "model.layers.24.mlp.experts.113.gate_proj", "model.layers.24.mlp.experts.114.gate_proj", "model.layers.24.mlp.experts.115.gate_proj", "model.layers.24.mlp.experts.116.gate_proj", "model.layers.24.mlp.experts.117.gate_proj", "model.layers.24.mlp.experts.118.gate_proj", "model.layers.24.mlp.experts.119.gate_proj", "model.layers.24.mlp.experts.120.gate_proj", "model.layers.24.mlp.experts.121.gate_proj", "model.layers.24.mlp.experts.122.gate_proj", "model.layers.24.mlp.experts.123.gate_proj", "model.layers.24.mlp.experts.124.gate_proj", "model.layers.24.mlp.experts.125.gate_proj", "model.layers.24.mlp.experts.126.gate_proj", "model.layers.24.mlp.experts.127.gate_proj", "model.layers.24.mlp.experts.128.gate_proj", "model.layers.24.mlp.experts.129.gate_proj", "model.layers.24.mlp.experts.130.gate_proj", "model.layers.24.mlp.experts.131.gate_proj", "model.layers.24.mlp.experts.132.gate_proj", "model.layers.24.mlp.experts.133.gate_proj", "model.layers.24.mlp.experts.134.gate_proj", "model.layers.24.mlp.experts.135.gate_proj", "model.layers.24.mlp.experts.136.gate_proj", "model.layers.24.mlp.experts.137.gate_proj", "model.layers.24.mlp.experts.138.gate_proj", "model.layers.24.mlp.experts.139.gate_proj", "model.layers.24.mlp.experts.140.gate_proj", "model.layers.24.mlp.experts.141.gate_proj", "model.layers.24.mlp.experts.142.gate_proj", "model.layers.24.mlp.experts.143.gate_proj", "model.layers.24.mlp.experts.144.gate_proj", "model.layers.24.mlp.experts.145.gate_proj", "model.layers.24.mlp.experts.146.gate_proj", "model.layers.24.mlp.experts.147.gate_proj", "model.layers.24.mlp.experts.148.gate_proj", "model.layers.24.mlp.experts.149.gate_proj", "model.layers.24.mlp.experts.150.gate_proj", "model.layers.24.mlp.experts.151.gate_proj", "model.layers.24.mlp.experts.152.gate_proj", "model.layers.24.mlp.experts.153.gate_proj", "model.layers.24.mlp.experts.154.gate_proj", "model.layers.24.mlp.experts.155.gate_proj", "model.layers.24.mlp.experts.156.gate_proj", "model.layers.24.mlp.experts.157.gate_proj", "model.layers.24.mlp.experts.158.gate_proj", "model.layers.24.mlp.experts.159.gate_proj", "model.layers.24.mlp.experts.0.up_proj", "model.layers.24.mlp.experts.1.up_proj", "model.layers.24.mlp.experts.2.up_proj", "model.layers.24.mlp.experts.3.up_proj", "model.layers.24.mlp.experts.4.up_proj", "model.layers.24.mlp.experts.5.up_proj", "model.layers.24.mlp.experts.6.up_proj", "model.layers.24.mlp.experts.7.up_proj", "model.layers.24.mlp.experts.8.up_proj", "model.layers.24.mlp.experts.9.up_proj", "model.layers.24.mlp.experts.10.up_proj", "model.layers.24.mlp.experts.11.up_proj", "model.layers.24.mlp.experts.12.up_proj", "model.layers.24.mlp.experts.13.up_proj", "model.layers.24.mlp.experts.14.up_proj", "model.layers.24.mlp.experts.15.up_proj", "model.layers.24.mlp.experts.16.up_proj", "model.layers.24.mlp.experts.17.up_proj", "model.layers.24.mlp.experts.18.up_proj", "model.layers.24.mlp.experts.19.up_proj", "model.layers.24.mlp.experts.20.up_proj", "model.layers.24.mlp.experts.21.up_proj", "model.layers.24.mlp.experts.22.up_proj", "model.layers.24.mlp.experts.23.up_proj", "model.layers.24.mlp.experts.24.up_proj", "model.layers.24.mlp.experts.25.up_proj", "model.layers.24.mlp.experts.26.up_proj", "model.layers.24.mlp.experts.27.up_proj", "model.layers.24.mlp.experts.28.up_proj", "model.layers.24.mlp.experts.29.up_proj", "model.layers.24.mlp.experts.30.up_proj", "model.layers.24.mlp.experts.31.up_proj", "model.layers.24.mlp.experts.32.up_proj", "model.layers.24.mlp.experts.33.up_proj", "model.layers.24.mlp.experts.34.up_proj", "model.layers.24.mlp.experts.35.up_proj", "model.layers.24.mlp.experts.36.up_proj", "model.layers.24.mlp.experts.37.up_proj", "model.layers.24.mlp.experts.38.up_proj", "model.layers.24.mlp.experts.39.up_proj", "model.layers.24.mlp.experts.40.up_proj", "model.layers.24.mlp.experts.41.up_proj", "model.layers.24.mlp.experts.42.up_proj", "model.layers.24.mlp.experts.43.up_proj", "model.layers.24.mlp.experts.44.up_proj", "model.layers.24.mlp.experts.45.up_proj", "model.layers.24.mlp.experts.46.up_proj", "model.layers.24.mlp.experts.47.up_proj", "model.layers.24.mlp.experts.48.up_proj", "model.layers.24.mlp.experts.49.up_proj", "model.layers.24.mlp.experts.50.up_proj", "model.layers.24.mlp.experts.51.up_proj", "model.layers.24.mlp.experts.52.up_proj", "model.layers.24.mlp.experts.53.up_proj", "model.layers.24.mlp.experts.54.up_proj", "model.layers.24.mlp.experts.55.up_proj", "model.layers.24.mlp.experts.56.up_proj", "model.layers.24.mlp.experts.57.up_proj", "model.layers.24.mlp.experts.58.up_proj", "model.layers.24.mlp.experts.59.up_proj", "model.layers.24.mlp.experts.60.up_proj", "model.layers.24.mlp.experts.61.up_proj", "model.layers.24.mlp.experts.62.up_proj", "model.layers.24.mlp.experts.63.up_proj", "model.layers.24.mlp.experts.64.up_proj", "model.layers.24.mlp.experts.65.up_proj", "model.layers.24.mlp.experts.66.up_proj", "model.layers.24.mlp.experts.67.up_proj", "model.layers.24.mlp.experts.68.up_proj", "model.layers.24.mlp.experts.69.up_proj", "model.layers.24.mlp.experts.70.up_proj", "model.layers.24.mlp.experts.71.up_proj", "model.layers.24.mlp.experts.72.up_proj", "model.layers.24.mlp.experts.73.up_proj", "model.layers.24.mlp.experts.74.up_proj", "model.layers.24.mlp.experts.75.up_proj", "model.layers.24.mlp.experts.76.up_proj", "model.layers.24.mlp.experts.77.up_proj", "model.layers.24.mlp.experts.78.up_proj", "model.layers.24.mlp.experts.79.up_proj", "model.layers.24.mlp.experts.80.up_proj", "model.layers.24.mlp.experts.81.up_proj", "model.layers.24.mlp.experts.82.up_proj", "model.layers.24.mlp.experts.83.up_proj", "model.layers.24.mlp.experts.84.up_proj", "model.layers.24.mlp.experts.85.up_proj", "model.layers.24.mlp.experts.86.up_proj", "model.layers.24.mlp.experts.87.up_proj", "model.layers.24.mlp.experts.88.up_proj", "model.layers.24.mlp.experts.89.up_proj", "model.layers.24.mlp.experts.90.up_proj", "model.layers.24.mlp.experts.91.up_proj", "model.layers.24.mlp.experts.92.up_proj", "model.layers.24.mlp.experts.93.up_proj", "model.layers.24.mlp.experts.94.up_proj", "model.layers.24.mlp.experts.95.up_proj", "model.layers.24.mlp.experts.96.up_proj", "model.layers.24.mlp.experts.97.up_proj", "model.layers.24.mlp.experts.98.up_proj", "model.layers.24.mlp.experts.99.up_proj", "model.layers.24.mlp.experts.100.up_proj", "model.layers.24.mlp.experts.101.up_proj", "model.layers.24.mlp.experts.102.up_proj", "model.layers.24.mlp.experts.103.up_proj", "model.layers.24.mlp.experts.104.up_proj", "model.layers.24.mlp.experts.105.up_proj", "model.layers.24.mlp.experts.106.up_proj", "model.layers.24.mlp.experts.107.up_proj", "model.layers.24.mlp.experts.108.up_proj", "model.layers.24.mlp.experts.109.up_proj", "model.layers.24.mlp.experts.110.up_proj", "model.layers.24.mlp.experts.111.up_proj", "model.layers.24.mlp.experts.112.up_proj", "model.layers.24.mlp.experts.113.up_proj", "model.layers.24.mlp.experts.114.up_proj", "model.layers.24.mlp.experts.115.up_proj", "model.layers.24.mlp.experts.116.up_proj", "model.layers.24.mlp.experts.117.up_proj", "model.layers.24.mlp.experts.118.up_proj", "model.layers.24.mlp.experts.119.up_proj", "model.layers.24.mlp.experts.120.up_proj", "model.layers.24.mlp.experts.121.up_proj", "model.layers.24.mlp.experts.122.up_proj", "model.layers.24.mlp.experts.123.up_proj", "model.layers.24.mlp.experts.124.up_proj", "model.layers.24.mlp.experts.125.up_proj", "model.layers.24.mlp.experts.126.up_proj", "model.layers.24.mlp.experts.127.up_proj", "model.layers.24.mlp.experts.128.up_proj", "model.layers.24.mlp.experts.129.up_proj", "model.layers.24.mlp.experts.130.up_proj", "model.layers.24.mlp.experts.131.up_proj", "model.layers.24.mlp.experts.132.up_proj", "model.layers.24.mlp.experts.133.up_proj", "model.layers.24.mlp.experts.134.up_proj", "model.layers.24.mlp.experts.135.up_proj", "model.layers.24.mlp.experts.136.up_proj", "model.layers.24.mlp.experts.137.up_proj", "model.layers.24.mlp.experts.138.up_proj", "model.layers.24.mlp.experts.139.up_proj", "model.layers.24.mlp.experts.140.up_proj", "model.layers.24.mlp.experts.141.up_proj", "model.layers.24.mlp.experts.142.up_proj", "model.layers.24.mlp.experts.143.up_proj", "model.layers.24.mlp.experts.144.up_proj", "model.layers.24.mlp.experts.145.up_proj", "model.layers.24.mlp.experts.146.up_proj", "model.layers.24.mlp.experts.147.up_proj", "model.layers.24.mlp.experts.148.up_proj", "model.layers.24.mlp.experts.149.up_proj", "model.layers.24.mlp.experts.150.up_proj", "model.layers.24.mlp.experts.151.up_proj", "model.layers.24.mlp.experts.152.up_proj", "model.layers.24.mlp.experts.153.up_proj", "model.layers.24.mlp.experts.154.up_proj", "model.layers.24.mlp.experts.155.up_proj", "model.layers.24.mlp.experts.156.up_proj", "model.layers.24.mlp.experts.157.up_proj", "model.layers.24.mlp.experts.158.up_proj", "model.layers.24.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.515890032051606e-06, "dbits": 2516582400 }, { "dkld": -3.828024491667713e-05, "dbits": 5033164800 } ] }, { "idx": 146, "layers": [ "model.layers.24.mlp.experts.0.down_proj", "model.layers.24.mlp.experts.1.down_proj", "model.layers.24.mlp.experts.2.down_proj", "model.layers.24.mlp.experts.3.down_proj", "model.layers.24.mlp.experts.4.down_proj", "model.layers.24.mlp.experts.5.down_proj", "model.layers.24.mlp.experts.6.down_proj", "model.layers.24.mlp.experts.7.down_proj", "model.layers.24.mlp.experts.8.down_proj", "model.layers.24.mlp.experts.9.down_proj", "model.layers.24.mlp.experts.10.down_proj", "model.layers.24.mlp.experts.11.down_proj", "model.layers.24.mlp.experts.12.down_proj", "model.layers.24.mlp.experts.13.down_proj", "model.layers.24.mlp.experts.14.down_proj", "model.layers.24.mlp.experts.15.down_proj", "model.layers.24.mlp.experts.16.down_proj", "model.layers.24.mlp.experts.17.down_proj", "model.layers.24.mlp.experts.18.down_proj", "model.layers.24.mlp.experts.19.down_proj", "model.layers.24.mlp.experts.20.down_proj", "model.layers.24.mlp.experts.21.down_proj", "model.layers.24.mlp.experts.22.down_proj", "model.layers.24.mlp.experts.23.down_proj", "model.layers.24.mlp.experts.24.down_proj", "model.layers.24.mlp.experts.25.down_proj", "model.layers.24.mlp.experts.26.down_proj", "model.layers.24.mlp.experts.27.down_proj", "model.layers.24.mlp.experts.28.down_proj", "model.layers.24.mlp.experts.29.down_proj", "model.layers.24.mlp.experts.30.down_proj", "model.layers.24.mlp.experts.31.down_proj", "model.layers.24.mlp.experts.32.down_proj", "model.layers.24.mlp.experts.33.down_proj", "model.layers.24.mlp.experts.34.down_proj", "model.layers.24.mlp.experts.35.down_proj", "model.layers.24.mlp.experts.36.down_proj", "model.layers.24.mlp.experts.37.down_proj", "model.layers.24.mlp.experts.38.down_proj", "model.layers.24.mlp.experts.39.down_proj", "model.layers.24.mlp.experts.40.down_proj", "model.layers.24.mlp.experts.41.down_proj", "model.layers.24.mlp.experts.42.down_proj", "model.layers.24.mlp.experts.43.down_proj", "model.layers.24.mlp.experts.44.down_proj", "model.layers.24.mlp.experts.45.down_proj", "model.layers.24.mlp.experts.46.down_proj", "model.layers.24.mlp.experts.47.down_proj", "model.layers.24.mlp.experts.48.down_proj", "model.layers.24.mlp.experts.49.down_proj", "model.layers.24.mlp.experts.50.down_proj", "model.layers.24.mlp.experts.51.down_proj", "model.layers.24.mlp.experts.52.down_proj", "model.layers.24.mlp.experts.53.down_proj", "model.layers.24.mlp.experts.54.down_proj", "model.layers.24.mlp.experts.55.down_proj", "model.layers.24.mlp.experts.56.down_proj", "model.layers.24.mlp.experts.57.down_proj", "model.layers.24.mlp.experts.58.down_proj", "model.layers.24.mlp.experts.59.down_proj", "model.layers.24.mlp.experts.60.down_proj", "model.layers.24.mlp.experts.61.down_proj", "model.layers.24.mlp.experts.62.down_proj", "model.layers.24.mlp.experts.63.down_proj", "model.layers.24.mlp.experts.64.down_proj", "model.layers.24.mlp.experts.65.down_proj", "model.layers.24.mlp.experts.66.down_proj", "model.layers.24.mlp.experts.67.down_proj", "model.layers.24.mlp.experts.68.down_proj", "model.layers.24.mlp.experts.69.down_proj", "model.layers.24.mlp.experts.70.down_proj", "model.layers.24.mlp.experts.71.down_proj", "model.layers.24.mlp.experts.72.down_proj", "model.layers.24.mlp.experts.73.down_proj", "model.layers.24.mlp.experts.74.down_proj", "model.layers.24.mlp.experts.75.down_proj", "model.layers.24.mlp.experts.76.down_proj", "model.layers.24.mlp.experts.77.down_proj", "model.layers.24.mlp.experts.78.down_proj", "model.layers.24.mlp.experts.79.down_proj", "model.layers.24.mlp.experts.80.down_proj", "model.layers.24.mlp.experts.81.down_proj", "model.layers.24.mlp.experts.82.down_proj", "model.layers.24.mlp.experts.83.down_proj", "model.layers.24.mlp.experts.84.down_proj", "model.layers.24.mlp.experts.85.down_proj", "model.layers.24.mlp.experts.86.down_proj", "model.layers.24.mlp.experts.87.down_proj", "model.layers.24.mlp.experts.88.down_proj", "model.layers.24.mlp.experts.89.down_proj", "model.layers.24.mlp.experts.90.down_proj", "model.layers.24.mlp.experts.91.down_proj", "model.layers.24.mlp.experts.92.down_proj", "model.layers.24.mlp.experts.93.down_proj", "model.layers.24.mlp.experts.94.down_proj", "model.layers.24.mlp.experts.95.down_proj", "model.layers.24.mlp.experts.96.down_proj", "model.layers.24.mlp.experts.97.down_proj", "model.layers.24.mlp.experts.98.down_proj", "model.layers.24.mlp.experts.99.down_proj", "model.layers.24.mlp.experts.100.down_proj", "model.layers.24.mlp.experts.101.down_proj", "model.layers.24.mlp.experts.102.down_proj", "model.layers.24.mlp.experts.103.down_proj", "model.layers.24.mlp.experts.104.down_proj", "model.layers.24.mlp.experts.105.down_proj", "model.layers.24.mlp.experts.106.down_proj", "model.layers.24.mlp.experts.107.down_proj", "model.layers.24.mlp.experts.108.down_proj", "model.layers.24.mlp.experts.109.down_proj", "model.layers.24.mlp.experts.110.down_proj", "model.layers.24.mlp.experts.111.down_proj", "model.layers.24.mlp.experts.112.down_proj", "model.layers.24.mlp.experts.113.down_proj", "model.layers.24.mlp.experts.114.down_proj", "model.layers.24.mlp.experts.115.down_proj", "model.layers.24.mlp.experts.116.down_proj", "model.layers.24.mlp.experts.117.down_proj", "model.layers.24.mlp.experts.118.down_proj", "model.layers.24.mlp.experts.119.down_proj", "model.layers.24.mlp.experts.120.down_proj", "model.layers.24.mlp.experts.121.down_proj", "model.layers.24.mlp.experts.122.down_proj", "model.layers.24.mlp.experts.123.down_proj", "model.layers.24.mlp.experts.124.down_proj", "model.layers.24.mlp.experts.125.down_proj", "model.layers.24.mlp.experts.126.down_proj", "model.layers.24.mlp.experts.127.down_proj", "model.layers.24.mlp.experts.128.down_proj", "model.layers.24.mlp.experts.129.down_proj", "model.layers.24.mlp.experts.130.down_proj", "model.layers.24.mlp.experts.131.down_proj", "model.layers.24.mlp.experts.132.down_proj", "model.layers.24.mlp.experts.133.down_proj", "model.layers.24.mlp.experts.134.down_proj", "model.layers.24.mlp.experts.135.down_proj", "model.layers.24.mlp.experts.136.down_proj", "model.layers.24.mlp.experts.137.down_proj", "model.layers.24.mlp.experts.138.down_proj", "model.layers.24.mlp.experts.139.down_proj", "model.layers.24.mlp.experts.140.down_proj", "model.layers.24.mlp.experts.141.down_proj", "model.layers.24.mlp.experts.142.down_proj", "model.layers.24.mlp.experts.143.down_proj", "model.layers.24.mlp.experts.144.down_proj", "model.layers.24.mlp.experts.145.down_proj", "model.layers.24.mlp.experts.146.down_proj", "model.layers.24.mlp.experts.147.down_proj", "model.layers.24.mlp.experts.148.down_proj", "model.layers.24.mlp.experts.149.down_proj", "model.layers.24.mlp.experts.150.down_proj", "model.layers.24.mlp.experts.151.down_proj", "model.layers.24.mlp.experts.152.down_proj", "model.layers.24.mlp.experts.153.down_proj", "model.layers.24.mlp.experts.154.down_proj", "model.layers.24.mlp.experts.155.down_proj", "model.layers.24.mlp.experts.156.down_proj", "model.layers.24.mlp.experts.157.down_proj", "model.layers.24.mlp.experts.158.down_proj", "model.layers.24.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.6759215183555386e-05, "dbits": 1258291200 }, { "dkld": -6.235078908502917e-05, "dbits": 2516582400 } ] }, { "idx": 147, "layers": [ "model.layers.25.self_attn.q_proj" ], "candidates": [ { "dkld": -6.601428613066569e-05, "dbits": 62914560 }, { "dkld": -9.225199464708497e-05, "dbits": 125829120 } ] }, { "idx": 148, "layers": [ "model.layers.25.self_attn.k_proj", "model.layers.25.self_attn.v_proj" ], "candidates": [ { "dkld": -7.595880888402323e-05, "dbits": 10485760 }, { "dkld": -4.2387680150567444e-05, "dbits": 20971520 } ] }, { "idx": 149, "layers": [ "model.layers.25.self_attn.o_proj" ], "candidates": [ { "dkld": -2.604911569505791e-05, "dbits": 62914560 }, { "dkld": -5.145659670233692e-05, "dbits": 125829120 } ] }, { "idx": 150, "layers": [ "model.layers.25.mlp.shared_experts.gate_proj", "model.layers.25.mlp.shared_experts.up_proj", "model.layers.25.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 8.517436217516695e-05, "dbits": 23592960 }, { "dkld": 2.673659473657712e-05, "dbits": 47185920 } ] }, { "idx": 151, "layers": [ "model.layers.25.mlp.experts.0.gate_proj", "model.layers.25.mlp.experts.1.gate_proj", "model.layers.25.mlp.experts.2.gate_proj", "model.layers.25.mlp.experts.3.gate_proj", "model.layers.25.mlp.experts.4.gate_proj", "model.layers.25.mlp.experts.5.gate_proj", "model.layers.25.mlp.experts.6.gate_proj", "model.layers.25.mlp.experts.7.gate_proj", "model.layers.25.mlp.experts.8.gate_proj", "model.layers.25.mlp.experts.9.gate_proj", "model.layers.25.mlp.experts.10.gate_proj", "model.layers.25.mlp.experts.11.gate_proj", "model.layers.25.mlp.experts.12.gate_proj", "model.layers.25.mlp.experts.13.gate_proj", "model.layers.25.mlp.experts.14.gate_proj", "model.layers.25.mlp.experts.15.gate_proj", "model.layers.25.mlp.experts.16.gate_proj", "model.layers.25.mlp.experts.17.gate_proj", "model.layers.25.mlp.experts.18.gate_proj", "model.layers.25.mlp.experts.19.gate_proj", "model.layers.25.mlp.experts.20.gate_proj", "model.layers.25.mlp.experts.21.gate_proj", "model.layers.25.mlp.experts.22.gate_proj", "model.layers.25.mlp.experts.23.gate_proj", "model.layers.25.mlp.experts.24.gate_proj", "model.layers.25.mlp.experts.25.gate_proj", "model.layers.25.mlp.experts.26.gate_proj", "model.layers.25.mlp.experts.27.gate_proj", "model.layers.25.mlp.experts.28.gate_proj", "model.layers.25.mlp.experts.29.gate_proj", "model.layers.25.mlp.experts.30.gate_proj", "model.layers.25.mlp.experts.31.gate_proj", "model.layers.25.mlp.experts.32.gate_proj", "model.layers.25.mlp.experts.33.gate_proj", "model.layers.25.mlp.experts.34.gate_proj", "model.layers.25.mlp.experts.35.gate_proj", "model.layers.25.mlp.experts.36.gate_proj", "model.layers.25.mlp.experts.37.gate_proj", "model.layers.25.mlp.experts.38.gate_proj", "model.layers.25.mlp.experts.39.gate_proj", "model.layers.25.mlp.experts.40.gate_proj", "model.layers.25.mlp.experts.41.gate_proj", "model.layers.25.mlp.experts.42.gate_proj", "model.layers.25.mlp.experts.43.gate_proj", "model.layers.25.mlp.experts.44.gate_proj", "model.layers.25.mlp.experts.45.gate_proj", "model.layers.25.mlp.experts.46.gate_proj", "model.layers.25.mlp.experts.47.gate_proj", "model.layers.25.mlp.experts.48.gate_proj", "model.layers.25.mlp.experts.49.gate_proj", "model.layers.25.mlp.experts.50.gate_proj", "model.layers.25.mlp.experts.51.gate_proj", "model.layers.25.mlp.experts.52.gate_proj", "model.layers.25.mlp.experts.53.gate_proj", "model.layers.25.mlp.experts.54.gate_proj", "model.layers.25.mlp.experts.55.gate_proj", "model.layers.25.mlp.experts.56.gate_proj", "model.layers.25.mlp.experts.57.gate_proj", "model.layers.25.mlp.experts.58.gate_proj", "model.layers.25.mlp.experts.59.gate_proj", "model.layers.25.mlp.experts.60.gate_proj", "model.layers.25.mlp.experts.61.gate_proj", "model.layers.25.mlp.experts.62.gate_proj", "model.layers.25.mlp.experts.63.gate_proj", "model.layers.25.mlp.experts.64.gate_proj", "model.layers.25.mlp.experts.65.gate_proj", "model.layers.25.mlp.experts.66.gate_proj", "model.layers.25.mlp.experts.67.gate_proj", "model.layers.25.mlp.experts.68.gate_proj", "model.layers.25.mlp.experts.69.gate_proj", "model.layers.25.mlp.experts.70.gate_proj", "model.layers.25.mlp.experts.71.gate_proj", "model.layers.25.mlp.experts.72.gate_proj", "model.layers.25.mlp.experts.73.gate_proj", "model.layers.25.mlp.experts.74.gate_proj", "model.layers.25.mlp.experts.75.gate_proj", "model.layers.25.mlp.experts.76.gate_proj", "model.layers.25.mlp.experts.77.gate_proj", "model.layers.25.mlp.experts.78.gate_proj", "model.layers.25.mlp.experts.79.gate_proj", "model.layers.25.mlp.experts.80.gate_proj", "model.layers.25.mlp.experts.81.gate_proj", "model.layers.25.mlp.experts.82.gate_proj", "model.layers.25.mlp.experts.83.gate_proj", "model.layers.25.mlp.experts.84.gate_proj", "model.layers.25.mlp.experts.85.gate_proj", "model.layers.25.mlp.experts.86.gate_proj", "model.layers.25.mlp.experts.87.gate_proj", "model.layers.25.mlp.experts.88.gate_proj", "model.layers.25.mlp.experts.89.gate_proj", "model.layers.25.mlp.experts.90.gate_proj", "model.layers.25.mlp.experts.91.gate_proj", "model.layers.25.mlp.experts.92.gate_proj", "model.layers.25.mlp.experts.93.gate_proj", "model.layers.25.mlp.experts.94.gate_proj", "model.layers.25.mlp.experts.95.gate_proj", "model.layers.25.mlp.experts.96.gate_proj", "model.layers.25.mlp.experts.97.gate_proj", "model.layers.25.mlp.experts.98.gate_proj", "model.layers.25.mlp.experts.99.gate_proj", "model.layers.25.mlp.experts.100.gate_proj", "model.layers.25.mlp.experts.101.gate_proj", "model.layers.25.mlp.experts.102.gate_proj", "model.layers.25.mlp.experts.103.gate_proj", "model.layers.25.mlp.experts.104.gate_proj", "model.layers.25.mlp.experts.105.gate_proj", "model.layers.25.mlp.experts.106.gate_proj", "model.layers.25.mlp.experts.107.gate_proj", "model.layers.25.mlp.experts.108.gate_proj", "model.layers.25.mlp.experts.109.gate_proj", "model.layers.25.mlp.experts.110.gate_proj", "model.layers.25.mlp.experts.111.gate_proj", "model.layers.25.mlp.experts.112.gate_proj", "model.layers.25.mlp.experts.113.gate_proj", "model.layers.25.mlp.experts.114.gate_proj", "model.layers.25.mlp.experts.115.gate_proj", "model.layers.25.mlp.experts.116.gate_proj", "model.layers.25.mlp.experts.117.gate_proj", "model.layers.25.mlp.experts.118.gate_proj", "model.layers.25.mlp.experts.119.gate_proj", "model.layers.25.mlp.experts.120.gate_proj", "model.layers.25.mlp.experts.121.gate_proj", "model.layers.25.mlp.experts.122.gate_proj", "model.layers.25.mlp.experts.123.gate_proj", "model.layers.25.mlp.experts.124.gate_proj", "model.layers.25.mlp.experts.125.gate_proj", "model.layers.25.mlp.experts.126.gate_proj", "model.layers.25.mlp.experts.127.gate_proj", "model.layers.25.mlp.experts.128.gate_proj", "model.layers.25.mlp.experts.129.gate_proj", "model.layers.25.mlp.experts.130.gate_proj", "model.layers.25.mlp.experts.131.gate_proj", "model.layers.25.mlp.experts.132.gate_proj", "model.layers.25.mlp.experts.133.gate_proj", "model.layers.25.mlp.experts.134.gate_proj", "model.layers.25.mlp.experts.135.gate_proj", "model.layers.25.mlp.experts.136.gate_proj", "model.layers.25.mlp.experts.137.gate_proj", "model.layers.25.mlp.experts.138.gate_proj", "model.layers.25.mlp.experts.139.gate_proj", "model.layers.25.mlp.experts.140.gate_proj", "model.layers.25.mlp.experts.141.gate_proj", "model.layers.25.mlp.experts.142.gate_proj", "model.layers.25.mlp.experts.143.gate_proj", "model.layers.25.mlp.experts.144.gate_proj", "model.layers.25.mlp.experts.145.gate_proj", "model.layers.25.mlp.experts.146.gate_proj", "model.layers.25.mlp.experts.147.gate_proj", "model.layers.25.mlp.experts.148.gate_proj", "model.layers.25.mlp.experts.149.gate_proj", "model.layers.25.mlp.experts.150.gate_proj", "model.layers.25.mlp.experts.151.gate_proj", "model.layers.25.mlp.experts.152.gate_proj", "model.layers.25.mlp.experts.153.gate_proj", "model.layers.25.mlp.experts.154.gate_proj", "model.layers.25.mlp.experts.155.gate_proj", "model.layers.25.mlp.experts.156.gate_proj", "model.layers.25.mlp.experts.157.gate_proj", "model.layers.25.mlp.experts.158.gate_proj", "model.layers.25.mlp.experts.159.gate_proj", "model.layers.25.mlp.experts.0.up_proj", "model.layers.25.mlp.experts.1.up_proj", "model.layers.25.mlp.experts.2.up_proj", "model.layers.25.mlp.experts.3.up_proj", "model.layers.25.mlp.experts.4.up_proj", "model.layers.25.mlp.experts.5.up_proj", "model.layers.25.mlp.experts.6.up_proj", "model.layers.25.mlp.experts.7.up_proj", "model.layers.25.mlp.experts.8.up_proj", "model.layers.25.mlp.experts.9.up_proj", "model.layers.25.mlp.experts.10.up_proj", "model.layers.25.mlp.experts.11.up_proj", "model.layers.25.mlp.experts.12.up_proj", "model.layers.25.mlp.experts.13.up_proj", "model.layers.25.mlp.experts.14.up_proj", "model.layers.25.mlp.experts.15.up_proj", "model.layers.25.mlp.experts.16.up_proj", "model.layers.25.mlp.experts.17.up_proj", "model.layers.25.mlp.experts.18.up_proj", "model.layers.25.mlp.experts.19.up_proj", "model.layers.25.mlp.experts.20.up_proj", "model.layers.25.mlp.experts.21.up_proj", "model.layers.25.mlp.experts.22.up_proj", "model.layers.25.mlp.experts.23.up_proj", "model.layers.25.mlp.experts.24.up_proj", "model.layers.25.mlp.experts.25.up_proj", "model.layers.25.mlp.experts.26.up_proj", "model.layers.25.mlp.experts.27.up_proj", "model.layers.25.mlp.experts.28.up_proj", "model.layers.25.mlp.experts.29.up_proj", "model.layers.25.mlp.experts.30.up_proj", "model.layers.25.mlp.experts.31.up_proj", "model.layers.25.mlp.experts.32.up_proj", "model.layers.25.mlp.experts.33.up_proj", "model.layers.25.mlp.experts.34.up_proj", "model.layers.25.mlp.experts.35.up_proj", "model.layers.25.mlp.experts.36.up_proj", "model.layers.25.mlp.experts.37.up_proj", "model.layers.25.mlp.experts.38.up_proj", "model.layers.25.mlp.experts.39.up_proj", "model.layers.25.mlp.experts.40.up_proj", "model.layers.25.mlp.experts.41.up_proj", "model.layers.25.mlp.experts.42.up_proj", "model.layers.25.mlp.experts.43.up_proj", "model.layers.25.mlp.experts.44.up_proj", "model.layers.25.mlp.experts.45.up_proj", "model.layers.25.mlp.experts.46.up_proj", "model.layers.25.mlp.experts.47.up_proj", "model.layers.25.mlp.experts.48.up_proj", "model.layers.25.mlp.experts.49.up_proj", "model.layers.25.mlp.experts.50.up_proj", "model.layers.25.mlp.experts.51.up_proj", "model.layers.25.mlp.experts.52.up_proj", "model.layers.25.mlp.experts.53.up_proj", "model.layers.25.mlp.experts.54.up_proj", "model.layers.25.mlp.experts.55.up_proj", "model.layers.25.mlp.experts.56.up_proj", "model.layers.25.mlp.experts.57.up_proj", "model.layers.25.mlp.experts.58.up_proj", "model.layers.25.mlp.experts.59.up_proj", "model.layers.25.mlp.experts.60.up_proj", "model.layers.25.mlp.experts.61.up_proj", "model.layers.25.mlp.experts.62.up_proj", "model.layers.25.mlp.experts.63.up_proj", "model.layers.25.mlp.experts.64.up_proj", "model.layers.25.mlp.experts.65.up_proj", "model.layers.25.mlp.experts.66.up_proj", "model.layers.25.mlp.experts.67.up_proj", "model.layers.25.mlp.experts.68.up_proj", "model.layers.25.mlp.experts.69.up_proj", "model.layers.25.mlp.experts.70.up_proj", "model.layers.25.mlp.experts.71.up_proj", "model.layers.25.mlp.experts.72.up_proj", "model.layers.25.mlp.experts.73.up_proj", "model.layers.25.mlp.experts.74.up_proj", "model.layers.25.mlp.experts.75.up_proj", "model.layers.25.mlp.experts.76.up_proj", "model.layers.25.mlp.experts.77.up_proj", "model.layers.25.mlp.experts.78.up_proj", "model.layers.25.mlp.experts.79.up_proj", "model.layers.25.mlp.experts.80.up_proj", "model.layers.25.mlp.experts.81.up_proj", "model.layers.25.mlp.experts.82.up_proj", "model.layers.25.mlp.experts.83.up_proj", "model.layers.25.mlp.experts.84.up_proj", "model.layers.25.mlp.experts.85.up_proj", "model.layers.25.mlp.experts.86.up_proj", "model.layers.25.mlp.experts.87.up_proj", "model.layers.25.mlp.experts.88.up_proj", "model.layers.25.mlp.experts.89.up_proj", "model.layers.25.mlp.experts.90.up_proj", "model.layers.25.mlp.experts.91.up_proj", "model.layers.25.mlp.experts.92.up_proj", "model.layers.25.mlp.experts.93.up_proj", "model.layers.25.mlp.experts.94.up_proj", "model.layers.25.mlp.experts.95.up_proj", "model.layers.25.mlp.experts.96.up_proj", "model.layers.25.mlp.experts.97.up_proj", "model.layers.25.mlp.experts.98.up_proj", "model.layers.25.mlp.experts.99.up_proj", "model.layers.25.mlp.experts.100.up_proj", "model.layers.25.mlp.experts.101.up_proj", "model.layers.25.mlp.experts.102.up_proj", "model.layers.25.mlp.experts.103.up_proj", "model.layers.25.mlp.experts.104.up_proj", "model.layers.25.mlp.experts.105.up_proj", "model.layers.25.mlp.experts.106.up_proj", "model.layers.25.mlp.experts.107.up_proj", "model.layers.25.mlp.experts.108.up_proj", "model.layers.25.mlp.experts.109.up_proj", "model.layers.25.mlp.experts.110.up_proj", "model.layers.25.mlp.experts.111.up_proj", "model.layers.25.mlp.experts.112.up_proj", "model.layers.25.mlp.experts.113.up_proj", "model.layers.25.mlp.experts.114.up_proj", "model.layers.25.mlp.experts.115.up_proj", "model.layers.25.mlp.experts.116.up_proj", "model.layers.25.mlp.experts.117.up_proj", "model.layers.25.mlp.experts.118.up_proj", "model.layers.25.mlp.experts.119.up_proj", "model.layers.25.mlp.experts.120.up_proj", "model.layers.25.mlp.experts.121.up_proj", "model.layers.25.mlp.experts.122.up_proj", "model.layers.25.mlp.experts.123.up_proj", "model.layers.25.mlp.experts.124.up_proj", "model.layers.25.mlp.experts.125.up_proj", "model.layers.25.mlp.experts.126.up_proj", "model.layers.25.mlp.experts.127.up_proj", "model.layers.25.mlp.experts.128.up_proj", "model.layers.25.mlp.experts.129.up_proj", "model.layers.25.mlp.experts.130.up_proj", "model.layers.25.mlp.experts.131.up_proj", "model.layers.25.mlp.experts.132.up_proj", "model.layers.25.mlp.experts.133.up_proj", "model.layers.25.mlp.experts.134.up_proj", "model.layers.25.mlp.experts.135.up_proj", "model.layers.25.mlp.experts.136.up_proj", "model.layers.25.mlp.experts.137.up_proj", "model.layers.25.mlp.experts.138.up_proj", "model.layers.25.mlp.experts.139.up_proj", "model.layers.25.mlp.experts.140.up_proj", "model.layers.25.mlp.experts.141.up_proj", "model.layers.25.mlp.experts.142.up_proj", "model.layers.25.mlp.experts.143.up_proj", "model.layers.25.mlp.experts.144.up_proj", "model.layers.25.mlp.experts.145.up_proj", "model.layers.25.mlp.experts.146.up_proj", "model.layers.25.mlp.experts.147.up_proj", "model.layers.25.mlp.experts.148.up_proj", "model.layers.25.mlp.experts.149.up_proj", "model.layers.25.mlp.experts.150.up_proj", "model.layers.25.mlp.experts.151.up_proj", "model.layers.25.mlp.experts.152.up_proj", "model.layers.25.mlp.experts.153.up_proj", "model.layers.25.mlp.experts.154.up_proj", "model.layers.25.mlp.experts.155.up_proj", "model.layers.25.mlp.experts.156.up_proj", "model.layers.25.mlp.experts.157.up_proj", "model.layers.25.mlp.experts.158.up_proj", "model.layers.25.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.75046879425631e-05, "dbits": 2516582400 }, { "dkld": -7.05417012795799e-05, "dbits": 5033164800 } ] }, { "idx": 152, "layers": [ "model.layers.25.mlp.experts.0.down_proj", "model.layers.25.mlp.experts.1.down_proj", "model.layers.25.mlp.experts.2.down_proj", "model.layers.25.mlp.experts.3.down_proj", "model.layers.25.mlp.experts.4.down_proj", "model.layers.25.mlp.experts.5.down_proj", "model.layers.25.mlp.experts.6.down_proj", "model.layers.25.mlp.experts.7.down_proj", "model.layers.25.mlp.experts.8.down_proj", "model.layers.25.mlp.experts.9.down_proj", "model.layers.25.mlp.experts.10.down_proj", "model.layers.25.mlp.experts.11.down_proj", "model.layers.25.mlp.experts.12.down_proj", "model.layers.25.mlp.experts.13.down_proj", "model.layers.25.mlp.experts.14.down_proj", "model.layers.25.mlp.experts.15.down_proj", "model.layers.25.mlp.experts.16.down_proj", "model.layers.25.mlp.experts.17.down_proj", "model.layers.25.mlp.experts.18.down_proj", "model.layers.25.mlp.experts.19.down_proj", "model.layers.25.mlp.experts.20.down_proj", "model.layers.25.mlp.experts.21.down_proj", "model.layers.25.mlp.experts.22.down_proj", "model.layers.25.mlp.experts.23.down_proj", "model.layers.25.mlp.experts.24.down_proj", "model.layers.25.mlp.experts.25.down_proj", "model.layers.25.mlp.experts.26.down_proj", "model.layers.25.mlp.experts.27.down_proj", "model.layers.25.mlp.experts.28.down_proj", "model.layers.25.mlp.experts.29.down_proj", "model.layers.25.mlp.experts.30.down_proj", "model.layers.25.mlp.experts.31.down_proj", "model.layers.25.mlp.experts.32.down_proj", "model.layers.25.mlp.experts.33.down_proj", "model.layers.25.mlp.experts.34.down_proj", "model.layers.25.mlp.experts.35.down_proj", "model.layers.25.mlp.experts.36.down_proj", "model.layers.25.mlp.experts.37.down_proj", "model.layers.25.mlp.experts.38.down_proj", "model.layers.25.mlp.experts.39.down_proj", "model.layers.25.mlp.experts.40.down_proj", "model.layers.25.mlp.experts.41.down_proj", "model.layers.25.mlp.experts.42.down_proj", "model.layers.25.mlp.experts.43.down_proj", "model.layers.25.mlp.experts.44.down_proj", "model.layers.25.mlp.experts.45.down_proj", "model.layers.25.mlp.experts.46.down_proj", "model.layers.25.mlp.experts.47.down_proj", "model.layers.25.mlp.experts.48.down_proj", "model.layers.25.mlp.experts.49.down_proj", "model.layers.25.mlp.experts.50.down_proj", "model.layers.25.mlp.experts.51.down_proj", "model.layers.25.mlp.experts.52.down_proj", "model.layers.25.mlp.experts.53.down_proj", "model.layers.25.mlp.experts.54.down_proj", "model.layers.25.mlp.experts.55.down_proj", "model.layers.25.mlp.experts.56.down_proj", "model.layers.25.mlp.experts.57.down_proj", "model.layers.25.mlp.experts.58.down_proj", "model.layers.25.mlp.experts.59.down_proj", "model.layers.25.mlp.experts.60.down_proj", "model.layers.25.mlp.experts.61.down_proj", "model.layers.25.mlp.experts.62.down_proj", "model.layers.25.mlp.experts.63.down_proj", "model.layers.25.mlp.experts.64.down_proj", "model.layers.25.mlp.experts.65.down_proj", "model.layers.25.mlp.experts.66.down_proj", "model.layers.25.mlp.experts.67.down_proj", "model.layers.25.mlp.experts.68.down_proj", "model.layers.25.mlp.experts.69.down_proj", "model.layers.25.mlp.experts.70.down_proj", "model.layers.25.mlp.experts.71.down_proj", "model.layers.25.mlp.experts.72.down_proj", "model.layers.25.mlp.experts.73.down_proj", "model.layers.25.mlp.experts.74.down_proj", "model.layers.25.mlp.experts.75.down_proj", "model.layers.25.mlp.experts.76.down_proj", "model.layers.25.mlp.experts.77.down_proj", "model.layers.25.mlp.experts.78.down_proj", "model.layers.25.mlp.experts.79.down_proj", "model.layers.25.mlp.experts.80.down_proj", "model.layers.25.mlp.experts.81.down_proj", "model.layers.25.mlp.experts.82.down_proj", "model.layers.25.mlp.experts.83.down_proj", "model.layers.25.mlp.experts.84.down_proj", "model.layers.25.mlp.experts.85.down_proj", "model.layers.25.mlp.experts.86.down_proj", "model.layers.25.mlp.experts.87.down_proj", "model.layers.25.mlp.experts.88.down_proj", "model.layers.25.mlp.experts.89.down_proj", "model.layers.25.mlp.experts.90.down_proj", "model.layers.25.mlp.experts.91.down_proj", "model.layers.25.mlp.experts.92.down_proj", "model.layers.25.mlp.experts.93.down_proj", "model.layers.25.mlp.experts.94.down_proj", "model.layers.25.mlp.experts.95.down_proj", "model.layers.25.mlp.experts.96.down_proj", "model.layers.25.mlp.experts.97.down_proj", "model.layers.25.mlp.experts.98.down_proj", "model.layers.25.mlp.experts.99.down_proj", "model.layers.25.mlp.experts.100.down_proj", "model.layers.25.mlp.experts.101.down_proj", "model.layers.25.mlp.experts.102.down_proj", "model.layers.25.mlp.experts.103.down_proj", "model.layers.25.mlp.experts.104.down_proj", "model.layers.25.mlp.experts.105.down_proj", "model.layers.25.mlp.experts.106.down_proj", "model.layers.25.mlp.experts.107.down_proj", "model.layers.25.mlp.experts.108.down_proj", "model.layers.25.mlp.experts.109.down_proj", "model.layers.25.mlp.experts.110.down_proj", "model.layers.25.mlp.experts.111.down_proj", "model.layers.25.mlp.experts.112.down_proj", "model.layers.25.mlp.experts.113.down_proj", "model.layers.25.mlp.experts.114.down_proj", "model.layers.25.mlp.experts.115.down_proj", "model.layers.25.mlp.experts.116.down_proj", "model.layers.25.mlp.experts.117.down_proj", "model.layers.25.mlp.experts.118.down_proj", "model.layers.25.mlp.experts.119.down_proj", "model.layers.25.mlp.experts.120.down_proj", "model.layers.25.mlp.experts.121.down_proj", "model.layers.25.mlp.experts.122.down_proj", "model.layers.25.mlp.experts.123.down_proj", "model.layers.25.mlp.experts.124.down_proj", "model.layers.25.mlp.experts.125.down_proj", "model.layers.25.mlp.experts.126.down_proj", "model.layers.25.mlp.experts.127.down_proj", "model.layers.25.mlp.experts.128.down_proj", "model.layers.25.mlp.experts.129.down_proj", "model.layers.25.mlp.experts.130.down_proj", "model.layers.25.mlp.experts.131.down_proj", "model.layers.25.mlp.experts.132.down_proj", "model.layers.25.mlp.experts.133.down_proj", "model.layers.25.mlp.experts.134.down_proj", "model.layers.25.mlp.experts.135.down_proj", "model.layers.25.mlp.experts.136.down_proj", "model.layers.25.mlp.experts.137.down_proj", "model.layers.25.mlp.experts.138.down_proj", "model.layers.25.mlp.experts.139.down_proj", "model.layers.25.mlp.experts.140.down_proj", "model.layers.25.mlp.experts.141.down_proj", "model.layers.25.mlp.experts.142.down_proj", "model.layers.25.mlp.experts.143.down_proj", "model.layers.25.mlp.experts.144.down_proj", "model.layers.25.mlp.experts.145.down_proj", "model.layers.25.mlp.experts.146.down_proj", "model.layers.25.mlp.experts.147.down_proj", "model.layers.25.mlp.experts.148.down_proj", "model.layers.25.mlp.experts.149.down_proj", "model.layers.25.mlp.experts.150.down_proj", "model.layers.25.mlp.experts.151.down_proj", "model.layers.25.mlp.experts.152.down_proj", "model.layers.25.mlp.experts.153.down_proj", "model.layers.25.mlp.experts.154.down_proj", "model.layers.25.mlp.experts.155.down_proj", "model.layers.25.mlp.experts.156.down_proj", "model.layers.25.mlp.experts.157.down_proj", "model.layers.25.mlp.experts.158.down_proj", "model.layers.25.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.4016463905571503e-05, "dbits": 1258291200 }, { "dkld": -1.690853387117247e-05, "dbits": 2516582400 } ] }, { "idx": 153, "layers": [ "model.layers.26.self_attn.q_proj" ], "candidates": [ { "dkld": -1.0287691839038632e-05, "dbits": 62914560 }, { "dkld": -7.060430943965808e-05, "dbits": 125829120 } ] }, { "idx": 154, "layers": [ "model.layers.26.self_attn.k_proj", "model.layers.26.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00013461676426231722, "dbits": 10485760 }, { "dkld": -0.00021653075236827135, "dbits": 20971520 } ] }, { "idx": 155, "layers": [ "model.layers.26.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00023278440348803962, "dbits": 62914560 }, { "dkld": -0.00020531699992716243, "dbits": 125829120 } ] }, { "idx": 156, "layers": [ "model.layers.26.mlp.shared_experts.gate_proj", "model.layers.26.mlp.shared_experts.up_proj", "model.layers.26.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.5364413633942604e-05, "dbits": 23592960 }, { "dkld": -6.0412799939513206e-05, "dbits": 47185920 } ] }, { "idx": 157, "layers": [ "model.layers.26.mlp.experts.0.gate_proj", "model.layers.26.mlp.experts.1.gate_proj", "model.layers.26.mlp.experts.2.gate_proj", "model.layers.26.mlp.experts.3.gate_proj", "model.layers.26.mlp.experts.4.gate_proj", "model.layers.26.mlp.experts.5.gate_proj", "model.layers.26.mlp.experts.6.gate_proj", "model.layers.26.mlp.experts.7.gate_proj", "model.layers.26.mlp.experts.8.gate_proj", "model.layers.26.mlp.experts.9.gate_proj", "model.layers.26.mlp.experts.10.gate_proj", "model.layers.26.mlp.experts.11.gate_proj", "model.layers.26.mlp.experts.12.gate_proj", "model.layers.26.mlp.experts.13.gate_proj", "model.layers.26.mlp.experts.14.gate_proj", "model.layers.26.mlp.experts.15.gate_proj", "model.layers.26.mlp.experts.16.gate_proj", "model.layers.26.mlp.experts.17.gate_proj", "model.layers.26.mlp.experts.18.gate_proj", "model.layers.26.mlp.experts.19.gate_proj", "model.layers.26.mlp.experts.20.gate_proj", "model.layers.26.mlp.experts.21.gate_proj", "model.layers.26.mlp.experts.22.gate_proj", "model.layers.26.mlp.experts.23.gate_proj", "model.layers.26.mlp.experts.24.gate_proj", "model.layers.26.mlp.experts.25.gate_proj", "model.layers.26.mlp.experts.26.gate_proj", "model.layers.26.mlp.experts.27.gate_proj", "model.layers.26.mlp.experts.28.gate_proj", "model.layers.26.mlp.experts.29.gate_proj", "model.layers.26.mlp.experts.30.gate_proj", "model.layers.26.mlp.experts.31.gate_proj", "model.layers.26.mlp.experts.32.gate_proj", "model.layers.26.mlp.experts.33.gate_proj", "model.layers.26.mlp.experts.34.gate_proj", "model.layers.26.mlp.experts.35.gate_proj", "model.layers.26.mlp.experts.36.gate_proj", "model.layers.26.mlp.experts.37.gate_proj", "model.layers.26.mlp.experts.38.gate_proj", "model.layers.26.mlp.experts.39.gate_proj", "model.layers.26.mlp.experts.40.gate_proj", "model.layers.26.mlp.experts.41.gate_proj", "model.layers.26.mlp.experts.42.gate_proj", "model.layers.26.mlp.experts.43.gate_proj", "model.layers.26.mlp.experts.44.gate_proj", "model.layers.26.mlp.experts.45.gate_proj", "model.layers.26.mlp.experts.46.gate_proj", "model.layers.26.mlp.experts.47.gate_proj", "model.layers.26.mlp.experts.48.gate_proj", "model.layers.26.mlp.experts.49.gate_proj", "model.layers.26.mlp.experts.50.gate_proj", "model.layers.26.mlp.experts.51.gate_proj", "model.layers.26.mlp.experts.52.gate_proj", "model.layers.26.mlp.experts.53.gate_proj", "model.layers.26.mlp.experts.54.gate_proj", "model.layers.26.mlp.experts.55.gate_proj", "model.layers.26.mlp.experts.56.gate_proj", "model.layers.26.mlp.experts.57.gate_proj", "model.layers.26.mlp.experts.58.gate_proj", "model.layers.26.mlp.experts.59.gate_proj", "model.layers.26.mlp.experts.60.gate_proj", "model.layers.26.mlp.experts.61.gate_proj", "model.layers.26.mlp.experts.62.gate_proj", "model.layers.26.mlp.experts.63.gate_proj", "model.layers.26.mlp.experts.64.gate_proj", "model.layers.26.mlp.experts.65.gate_proj", "model.layers.26.mlp.experts.66.gate_proj", "model.layers.26.mlp.experts.67.gate_proj", "model.layers.26.mlp.experts.68.gate_proj", "model.layers.26.mlp.experts.69.gate_proj", "model.layers.26.mlp.experts.70.gate_proj", "model.layers.26.mlp.experts.71.gate_proj", "model.layers.26.mlp.experts.72.gate_proj", "model.layers.26.mlp.experts.73.gate_proj", "model.layers.26.mlp.experts.74.gate_proj", "model.layers.26.mlp.experts.75.gate_proj", "model.layers.26.mlp.experts.76.gate_proj", "model.layers.26.mlp.experts.77.gate_proj", "model.layers.26.mlp.experts.78.gate_proj", "model.layers.26.mlp.experts.79.gate_proj", "model.layers.26.mlp.experts.80.gate_proj", "model.layers.26.mlp.experts.81.gate_proj", "model.layers.26.mlp.experts.82.gate_proj", "model.layers.26.mlp.experts.83.gate_proj", "model.layers.26.mlp.experts.84.gate_proj", "model.layers.26.mlp.experts.85.gate_proj", "model.layers.26.mlp.experts.86.gate_proj", "model.layers.26.mlp.experts.87.gate_proj", "model.layers.26.mlp.experts.88.gate_proj", "model.layers.26.mlp.experts.89.gate_proj", "model.layers.26.mlp.experts.90.gate_proj", "model.layers.26.mlp.experts.91.gate_proj", "model.layers.26.mlp.experts.92.gate_proj", "model.layers.26.mlp.experts.93.gate_proj", "model.layers.26.mlp.experts.94.gate_proj", "model.layers.26.mlp.experts.95.gate_proj", "model.layers.26.mlp.experts.96.gate_proj", "model.layers.26.mlp.experts.97.gate_proj", "model.layers.26.mlp.experts.98.gate_proj", "model.layers.26.mlp.experts.99.gate_proj", "model.layers.26.mlp.experts.100.gate_proj", "model.layers.26.mlp.experts.101.gate_proj", "model.layers.26.mlp.experts.102.gate_proj", "model.layers.26.mlp.experts.103.gate_proj", "model.layers.26.mlp.experts.104.gate_proj", "model.layers.26.mlp.experts.105.gate_proj", "model.layers.26.mlp.experts.106.gate_proj", "model.layers.26.mlp.experts.107.gate_proj", "model.layers.26.mlp.experts.108.gate_proj", "model.layers.26.mlp.experts.109.gate_proj", "model.layers.26.mlp.experts.110.gate_proj", "model.layers.26.mlp.experts.111.gate_proj", "model.layers.26.mlp.experts.112.gate_proj", "model.layers.26.mlp.experts.113.gate_proj", "model.layers.26.mlp.experts.114.gate_proj", "model.layers.26.mlp.experts.115.gate_proj", "model.layers.26.mlp.experts.116.gate_proj", "model.layers.26.mlp.experts.117.gate_proj", "model.layers.26.mlp.experts.118.gate_proj", "model.layers.26.mlp.experts.119.gate_proj", "model.layers.26.mlp.experts.120.gate_proj", "model.layers.26.mlp.experts.121.gate_proj", "model.layers.26.mlp.experts.122.gate_proj", "model.layers.26.mlp.experts.123.gate_proj", "model.layers.26.mlp.experts.124.gate_proj", "model.layers.26.mlp.experts.125.gate_proj", "model.layers.26.mlp.experts.126.gate_proj", "model.layers.26.mlp.experts.127.gate_proj", "model.layers.26.mlp.experts.128.gate_proj", "model.layers.26.mlp.experts.129.gate_proj", "model.layers.26.mlp.experts.130.gate_proj", "model.layers.26.mlp.experts.131.gate_proj", "model.layers.26.mlp.experts.132.gate_proj", "model.layers.26.mlp.experts.133.gate_proj", "model.layers.26.mlp.experts.134.gate_proj", "model.layers.26.mlp.experts.135.gate_proj", "model.layers.26.mlp.experts.136.gate_proj", "model.layers.26.mlp.experts.137.gate_proj", "model.layers.26.mlp.experts.138.gate_proj", "model.layers.26.mlp.experts.139.gate_proj", "model.layers.26.mlp.experts.140.gate_proj", "model.layers.26.mlp.experts.141.gate_proj", "model.layers.26.mlp.experts.142.gate_proj", "model.layers.26.mlp.experts.143.gate_proj", "model.layers.26.mlp.experts.144.gate_proj", "model.layers.26.mlp.experts.145.gate_proj", "model.layers.26.mlp.experts.146.gate_proj", "model.layers.26.mlp.experts.147.gate_proj", "model.layers.26.mlp.experts.148.gate_proj", "model.layers.26.mlp.experts.149.gate_proj", "model.layers.26.mlp.experts.150.gate_proj", "model.layers.26.mlp.experts.151.gate_proj", "model.layers.26.mlp.experts.152.gate_proj", "model.layers.26.mlp.experts.153.gate_proj", "model.layers.26.mlp.experts.154.gate_proj", "model.layers.26.mlp.experts.155.gate_proj", "model.layers.26.mlp.experts.156.gate_proj", "model.layers.26.mlp.experts.157.gate_proj", "model.layers.26.mlp.experts.158.gate_proj", "model.layers.26.mlp.experts.159.gate_proj", "model.layers.26.mlp.experts.0.up_proj", "model.layers.26.mlp.experts.1.up_proj", "model.layers.26.mlp.experts.2.up_proj", "model.layers.26.mlp.experts.3.up_proj", "model.layers.26.mlp.experts.4.up_proj", "model.layers.26.mlp.experts.5.up_proj", "model.layers.26.mlp.experts.6.up_proj", "model.layers.26.mlp.experts.7.up_proj", "model.layers.26.mlp.experts.8.up_proj", "model.layers.26.mlp.experts.9.up_proj", "model.layers.26.mlp.experts.10.up_proj", "model.layers.26.mlp.experts.11.up_proj", "model.layers.26.mlp.experts.12.up_proj", "model.layers.26.mlp.experts.13.up_proj", "model.layers.26.mlp.experts.14.up_proj", "model.layers.26.mlp.experts.15.up_proj", "model.layers.26.mlp.experts.16.up_proj", "model.layers.26.mlp.experts.17.up_proj", "model.layers.26.mlp.experts.18.up_proj", "model.layers.26.mlp.experts.19.up_proj", "model.layers.26.mlp.experts.20.up_proj", "model.layers.26.mlp.experts.21.up_proj", "model.layers.26.mlp.experts.22.up_proj", "model.layers.26.mlp.experts.23.up_proj", "model.layers.26.mlp.experts.24.up_proj", "model.layers.26.mlp.experts.25.up_proj", "model.layers.26.mlp.experts.26.up_proj", "model.layers.26.mlp.experts.27.up_proj", "model.layers.26.mlp.experts.28.up_proj", "model.layers.26.mlp.experts.29.up_proj", "model.layers.26.mlp.experts.30.up_proj", "model.layers.26.mlp.experts.31.up_proj", "model.layers.26.mlp.experts.32.up_proj", "model.layers.26.mlp.experts.33.up_proj", "model.layers.26.mlp.experts.34.up_proj", "model.layers.26.mlp.experts.35.up_proj", "model.layers.26.mlp.experts.36.up_proj", "model.layers.26.mlp.experts.37.up_proj", "model.layers.26.mlp.experts.38.up_proj", "model.layers.26.mlp.experts.39.up_proj", "model.layers.26.mlp.experts.40.up_proj", "model.layers.26.mlp.experts.41.up_proj", "model.layers.26.mlp.experts.42.up_proj", "model.layers.26.mlp.experts.43.up_proj", "model.layers.26.mlp.experts.44.up_proj", "model.layers.26.mlp.experts.45.up_proj", "model.layers.26.mlp.experts.46.up_proj", "model.layers.26.mlp.experts.47.up_proj", "model.layers.26.mlp.experts.48.up_proj", "model.layers.26.mlp.experts.49.up_proj", "model.layers.26.mlp.experts.50.up_proj", "model.layers.26.mlp.experts.51.up_proj", "model.layers.26.mlp.experts.52.up_proj", "model.layers.26.mlp.experts.53.up_proj", "model.layers.26.mlp.experts.54.up_proj", "model.layers.26.mlp.experts.55.up_proj", "model.layers.26.mlp.experts.56.up_proj", "model.layers.26.mlp.experts.57.up_proj", "model.layers.26.mlp.experts.58.up_proj", "model.layers.26.mlp.experts.59.up_proj", "model.layers.26.mlp.experts.60.up_proj", "model.layers.26.mlp.experts.61.up_proj", "model.layers.26.mlp.experts.62.up_proj", "model.layers.26.mlp.experts.63.up_proj", "model.layers.26.mlp.experts.64.up_proj", "model.layers.26.mlp.experts.65.up_proj", "model.layers.26.mlp.experts.66.up_proj", "model.layers.26.mlp.experts.67.up_proj", "model.layers.26.mlp.experts.68.up_proj", "model.layers.26.mlp.experts.69.up_proj", "model.layers.26.mlp.experts.70.up_proj", "model.layers.26.mlp.experts.71.up_proj", "model.layers.26.mlp.experts.72.up_proj", "model.layers.26.mlp.experts.73.up_proj", "model.layers.26.mlp.experts.74.up_proj", "model.layers.26.mlp.experts.75.up_proj", "model.layers.26.mlp.experts.76.up_proj", "model.layers.26.mlp.experts.77.up_proj", "model.layers.26.mlp.experts.78.up_proj", "model.layers.26.mlp.experts.79.up_proj", "model.layers.26.mlp.experts.80.up_proj", "model.layers.26.mlp.experts.81.up_proj", "model.layers.26.mlp.experts.82.up_proj", "model.layers.26.mlp.experts.83.up_proj", "model.layers.26.mlp.experts.84.up_proj", "model.layers.26.mlp.experts.85.up_proj", "model.layers.26.mlp.experts.86.up_proj", "model.layers.26.mlp.experts.87.up_proj", "model.layers.26.mlp.experts.88.up_proj", "model.layers.26.mlp.experts.89.up_proj", "model.layers.26.mlp.experts.90.up_proj", "model.layers.26.mlp.experts.91.up_proj", "model.layers.26.mlp.experts.92.up_proj", "model.layers.26.mlp.experts.93.up_proj", "model.layers.26.mlp.experts.94.up_proj", "model.layers.26.mlp.experts.95.up_proj", "model.layers.26.mlp.experts.96.up_proj", "model.layers.26.mlp.experts.97.up_proj", "model.layers.26.mlp.experts.98.up_proj", "model.layers.26.mlp.experts.99.up_proj", "model.layers.26.mlp.experts.100.up_proj", "model.layers.26.mlp.experts.101.up_proj", "model.layers.26.mlp.experts.102.up_proj", "model.layers.26.mlp.experts.103.up_proj", "model.layers.26.mlp.experts.104.up_proj", "model.layers.26.mlp.experts.105.up_proj", "model.layers.26.mlp.experts.106.up_proj", "model.layers.26.mlp.experts.107.up_proj", "model.layers.26.mlp.experts.108.up_proj", "model.layers.26.mlp.experts.109.up_proj", "model.layers.26.mlp.experts.110.up_proj", "model.layers.26.mlp.experts.111.up_proj", "model.layers.26.mlp.experts.112.up_proj", "model.layers.26.mlp.experts.113.up_proj", "model.layers.26.mlp.experts.114.up_proj", "model.layers.26.mlp.experts.115.up_proj", "model.layers.26.mlp.experts.116.up_proj", "model.layers.26.mlp.experts.117.up_proj", "model.layers.26.mlp.experts.118.up_proj", "model.layers.26.mlp.experts.119.up_proj", "model.layers.26.mlp.experts.120.up_proj", "model.layers.26.mlp.experts.121.up_proj", "model.layers.26.mlp.experts.122.up_proj", "model.layers.26.mlp.experts.123.up_proj", "model.layers.26.mlp.experts.124.up_proj", "model.layers.26.mlp.experts.125.up_proj", "model.layers.26.mlp.experts.126.up_proj", "model.layers.26.mlp.experts.127.up_proj", "model.layers.26.mlp.experts.128.up_proj", "model.layers.26.mlp.experts.129.up_proj", "model.layers.26.mlp.experts.130.up_proj", "model.layers.26.mlp.experts.131.up_proj", "model.layers.26.mlp.experts.132.up_proj", "model.layers.26.mlp.experts.133.up_proj", "model.layers.26.mlp.experts.134.up_proj", "model.layers.26.mlp.experts.135.up_proj", "model.layers.26.mlp.experts.136.up_proj", "model.layers.26.mlp.experts.137.up_proj", "model.layers.26.mlp.experts.138.up_proj", "model.layers.26.mlp.experts.139.up_proj", "model.layers.26.mlp.experts.140.up_proj", "model.layers.26.mlp.experts.141.up_proj", "model.layers.26.mlp.experts.142.up_proj", "model.layers.26.mlp.experts.143.up_proj", "model.layers.26.mlp.experts.144.up_proj", "model.layers.26.mlp.experts.145.up_proj", "model.layers.26.mlp.experts.146.up_proj", "model.layers.26.mlp.experts.147.up_proj", "model.layers.26.mlp.experts.148.up_proj", "model.layers.26.mlp.experts.149.up_proj", "model.layers.26.mlp.experts.150.up_proj", "model.layers.26.mlp.experts.151.up_proj", "model.layers.26.mlp.experts.152.up_proj", "model.layers.26.mlp.experts.153.up_proj", "model.layers.26.mlp.experts.154.up_proj", "model.layers.26.mlp.experts.155.up_proj", "model.layers.26.mlp.experts.156.up_proj", "model.layers.26.mlp.experts.157.up_proj", "model.layers.26.mlp.experts.158.up_proj", "model.layers.26.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.659094847738604e-05, "dbits": 2516582400 }, { "dkld": -6.255093030631438e-05, "dbits": 5033164800 } ] }, { "idx": 158, "layers": [ "model.layers.26.mlp.experts.0.down_proj", "model.layers.26.mlp.experts.1.down_proj", "model.layers.26.mlp.experts.2.down_proj", "model.layers.26.mlp.experts.3.down_proj", "model.layers.26.mlp.experts.4.down_proj", "model.layers.26.mlp.experts.5.down_proj", "model.layers.26.mlp.experts.6.down_proj", "model.layers.26.mlp.experts.7.down_proj", "model.layers.26.mlp.experts.8.down_proj", "model.layers.26.mlp.experts.9.down_proj", "model.layers.26.mlp.experts.10.down_proj", "model.layers.26.mlp.experts.11.down_proj", "model.layers.26.mlp.experts.12.down_proj", "model.layers.26.mlp.experts.13.down_proj", "model.layers.26.mlp.experts.14.down_proj", "model.layers.26.mlp.experts.15.down_proj", "model.layers.26.mlp.experts.16.down_proj", "model.layers.26.mlp.experts.17.down_proj", "model.layers.26.mlp.experts.18.down_proj", "model.layers.26.mlp.experts.19.down_proj", "model.layers.26.mlp.experts.20.down_proj", "model.layers.26.mlp.experts.21.down_proj", "model.layers.26.mlp.experts.22.down_proj", "model.layers.26.mlp.experts.23.down_proj", "model.layers.26.mlp.experts.24.down_proj", "model.layers.26.mlp.experts.25.down_proj", "model.layers.26.mlp.experts.26.down_proj", "model.layers.26.mlp.experts.27.down_proj", "model.layers.26.mlp.experts.28.down_proj", "model.layers.26.mlp.experts.29.down_proj", "model.layers.26.mlp.experts.30.down_proj", "model.layers.26.mlp.experts.31.down_proj", "model.layers.26.mlp.experts.32.down_proj", "model.layers.26.mlp.experts.33.down_proj", "model.layers.26.mlp.experts.34.down_proj", "model.layers.26.mlp.experts.35.down_proj", "model.layers.26.mlp.experts.36.down_proj", "model.layers.26.mlp.experts.37.down_proj", "model.layers.26.mlp.experts.38.down_proj", "model.layers.26.mlp.experts.39.down_proj", "model.layers.26.mlp.experts.40.down_proj", "model.layers.26.mlp.experts.41.down_proj", "model.layers.26.mlp.experts.42.down_proj", "model.layers.26.mlp.experts.43.down_proj", "model.layers.26.mlp.experts.44.down_proj", "model.layers.26.mlp.experts.45.down_proj", "model.layers.26.mlp.experts.46.down_proj", "model.layers.26.mlp.experts.47.down_proj", "model.layers.26.mlp.experts.48.down_proj", "model.layers.26.mlp.experts.49.down_proj", "model.layers.26.mlp.experts.50.down_proj", "model.layers.26.mlp.experts.51.down_proj", "model.layers.26.mlp.experts.52.down_proj", "model.layers.26.mlp.experts.53.down_proj", "model.layers.26.mlp.experts.54.down_proj", "model.layers.26.mlp.experts.55.down_proj", "model.layers.26.mlp.experts.56.down_proj", "model.layers.26.mlp.experts.57.down_proj", "model.layers.26.mlp.experts.58.down_proj", "model.layers.26.mlp.experts.59.down_proj", "model.layers.26.mlp.experts.60.down_proj", "model.layers.26.mlp.experts.61.down_proj", "model.layers.26.mlp.experts.62.down_proj", "model.layers.26.mlp.experts.63.down_proj", "model.layers.26.mlp.experts.64.down_proj", "model.layers.26.mlp.experts.65.down_proj", "model.layers.26.mlp.experts.66.down_proj", "model.layers.26.mlp.experts.67.down_proj", "model.layers.26.mlp.experts.68.down_proj", "model.layers.26.mlp.experts.69.down_proj", "model.layers.26.mlp.experts.70.down_proj", "model.layers.26.mlp.experts.71.down_proj", "model.layers.26.mlp.experts.72.down_proj", "model.layers.26.mlp.experts.73.down_proj", "model.layers.26.mlp.experts.74.down_proj", "model.layers.26.mlp.experts.75.down_proj", "model.layers.26.mlp.experts.76.down_proj", "model.layers.26.mlp.experts.77.down_proj", "model.layers.26.mlp.experts.78.down_proj", "model.layers.26.mlp.experts.79.down_proj", "model.layers.26.mlp.experts.80.down_proj", "model.layers.26.mlp.experts.81.down_proj", "model.layers.26.mlp.experts.82.down_proj", "model.layers.26.mlp.experts.83.down_proj", "model.layers.26.mlp.experts.84.down_proj", "model.layers.26.mlp.experts.85.down_proj", "model.layers.26.mlp.experts.86.down_proj", "model.layers.26.mlp.experts.87.down_proj", "model.layers.26.mlp.experts.88.down_proj", "model.layers.26.mlp.experts.89.down_proj", "model.layers.26.mlp.experts.90.down_proj", "model.layers.26.mlp.experts.91.down_proj", "model.layers.26.mlp.experts.92.down_proj", "model.layers.26.mlp.experts.93.down_proj", "model.layers.26.mlp.experts.94.down_proj", "model.layers.26.mlp.experts.95.down_proj", "model.layers.26.mlp.experts.96.down_proj", "model.layers.26.mlp.experts.97.down_proj", "model.layers.26.mlp.experts.98.down_proj", "model.layers.26.mlp.experts.99.down_proj", "model.layers.26.mlp.experts.100.down_proj", "model.layers.26.mlp.experts.101.down_proj", "model.layers.26.mlp.experts.102.down_proj", "model.layers.26.mlp.experts.103.down_proj", "model.layers.26.mlp.experts.104.down_proj", "model.layers.26.mlp.experts.105.down_proj", "model.layers.26.mlp.experts.106.down_proj", "model.layers.26.mlp.experts.107.down_proj", "model.layers.26.mlp.experts.108.down_proj", "model.layers.26.mlp.experts.109.down_proj", "model.layers.26.mlp.experts.110.down_proj", "model.layers.26.mlp.experts.111.down_proj", "model.layers.26.mlp.experts.112.down_proj", "model.layers.26.mlp.experts.113.down_proj", "model.layers.26.mlp.experts.114.down_proj", "model.layers.26.mlp.experts.115.down_proj", "model.layers.26.mlp.experts.116.down_proj", "model.layers.26.mlp.experts.117.down_proj", "model.layers.26.mlp.experts.118.down_proj", "model.layers.26.mlp.experts.119.down_proj", "model.layers.26.mlp.experts.120.down_proj", "model.layers.26.mlp.experts.121.down_proj", "model.layers.26.mlp.experts.122.down_proj", "model.layers.26.mlp.experts.123.down_proj", "model.layers.26.mlp.experts.124.down_proj", "model.layers.26.mlp.experts.125.down_proj", "model.layers.26.mlp.experts.126.down_proj", "model.layers.26.mlp.experts.127.down_proj", "model.layers.26.mlp.experts.128.down_proj", "model.layers.26.mlp.experts.129.down_proj", "model.layers.26.mlp.experts.130.down_proj", "model.layers.26.mlp.experts.131.down_proj", "model.layers.26.mlp.experts.132.down_proj", "model.layers.26.mlp.experts.133.down_proj", "model.layers.26.mlp.experts.134.down_proj", "model.layers.26.mlp.experts.135.down_proj", "model.layers.26.mlp.experts.136.down_proj", "model.layers.26.mlp.experts.137.down_proj", "model.layers.26.mlp.experts.138.down_proj", "model.layers.26.mlp.experts.139.down_proj", "model.layers.26.mlp.experts.140.down_proj", "model.layers.26.mlp.experts.141.down_proj", "model.layers.26.mlp.experts.142.down_proj", "model.layers.26.mlp.experts.143.down_proj", "model.layers.26.mlp.experts.144.down_proj", "model.layers.26.mlp.experts.145.down_proj", "model.layers.26.mlp.experts.146.down_proj", "model.layers.26.mlp.experts.147.down_proj", "model.layers.26.mlp.experts.148.down_proj", "model.layers.26.mlp.experts.149.down_proj", "model.layers.26.mlp.experts.150.down_proj", "model.layers.26.mlp.experts.151.down_proj", "model.layers.26.mlp.experts.152.down_proj", "model.layers.26.mlp.experts.153.down_proj", "model.layers.26.mlp.experts.154.down_proj", "model.layers.26.mlp.experts.155.down_proj", "model.layers.26.mlp.experts.156.down_proj", "model.layers.26.mlp.experts.157.down_proj", "model.layers.26.mlp.experts.158.down_proj", "model.layers.26.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.219543188809655e-06, "dbits": 1258291200 }, { "dkld": -3.606486134231056e-05, "dbits": 2516582400 } ] }, { "idx": 159, "layers": [ "model.layers.27.self_attn.q_proj" ], "candidates": [ { "dkld": 4.1788979433477966e-05, "dbits": 62914560 }, { "dkld": -1.879418268799747e-05, "dbits": 125829120 } ] }, { "idx": 160, "layers": [ "model.layers.27.self_attn.k_proj", "model.layers.27.self_attn.v_proj" ], "candidates": [ { "dkld": -2.967840991914203e-05, "dbits": 10485760 }, { "dkld": -8.268328383563908e-06, "dbits": 20971520 } ] }, { "idx": 161, "layers": [ "model.layers.27.self_attn.o_proj" ], "candidates": [ { "dkld": -3.69271729141335e-06, "dbits": 62914560 }, { "dkld": -0.0001259152544662353, "dbits": 125829120 } ] }, { "idx": 162, "layers": [ "model.layers.27.mlp.shared_experts.gate_proj", "model.layers.27.mlp.shared_experts.up_proj", "model.layers.27.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 4.1557056829334e-05, "dbits": 23592960 }, { "dkld": 7.563238032162224e-05, "dbits": 47185920 } ] }, { "idx": 163, "layers": [ "model.layers.27.mlp.experts.0.gate_proj", "model.layers.27.mlp.experts.1.gate_proj", "model.layers.27.mlp.experts.2.gate_proj", "model.layers.27.mlp.experts.3.gate_proj", "model.layers.27.mlp.experts.4.gate_proj", "model.layers.27.mlp.experts.5.gate_proj", "model.layers.27.mlp.experts.6.gate_proj", "model.layers.27.mlp.experts.7.gate_proj", "model.layers.27.mlp.experts.8.gate_proj", "model.layers.27.mlp.experts.9.gate_proj", "model.layers.27.mlp.experts.10.gate_proj", "model.layers.27.mlp.experts.11.gate_proj", "model.layers.27.mlp.experts.12.gate_proj", "model.layers.27.mlp.experts.13.gate_proj", "model.layers.27.mlp.experts.14.gate_proj", "model.layers.27.mlp.experts.15.gate_proj", "model.layers.27.mlp.experts.16.gate_proj", "model.layers.27.mlp.experts.17.gate_proj", "model.layers.27.mlp.experts.18.gate_proj", "model.layers.27.mlp.experts.19.gate_proj", "model.layers.27.mlp.experts.20.gate_proj", "model.layers.27.mlp.experts.21.gate_proj", "model.layers.27.mlp.experts.22.gate_proj", "model.layers.27.mlp.experts.23.gate_proj", "model.layers.27.mlp.experts.24.gate_proj", "model.layers.27.mlp.experts.25.gate_proj", "model.layers.27.mlp.experts.26.gate_proj", "model.layers.27.mlp.experts.27.gate_proj", "model.layers.27.mlp.experts.28.gate_proj", "model.layers.27.mlp.experts.29.gate_proj", "model.layers.27.mlp.experts.30.gate_proj", "model.layers.27.mlp.experts.31.gate_proj", "model.layers.27.mlp.experts.32.gate_proj", "model.layers.27.mlp.experts.33.gate_proj", "model.layers.27.mlp.experts.34.gate_proj", "model.layers.27.mlp.experts.35.gate_proj", "model.layers.27.mlp.experts.36.gate_proj", "model.layers.27.mlp.experts.37.gate_proj", "model.layers.27.mlp.experts.38.gate_proj", "model.layers.27.mlp.experts.39.gate_proj", "model.layers.27.mlp.experts.40.gate_proj", "model.layers.27.mlp.experts.41.gate_proj", "model.layers.27.mlp.experts.42.gate_proj", "model.layers.27.mlp.experts.43.gate_proj", "model.layers.27.mlp.experts.44.gate_proj", "model.layers.27.mlp.experts.45.gate_proj", "model.layers.27.mlp.experts.46.gate_proj", "model.layers.27.mlp.experts.47.gate_proj", "model.layers.27.mlp.experts.48.gate_proj", "model.layers.27.mlp.experts.49.gate_proj", "model.layers.27.mlp.experts.50.gate_proj", "model.layers.27.mlp.experts.51.gate_proj", "model.layers.27.mlp.experts.52.gate_proj", "model.layers.27.mlp.experts.53.gate_proj", "model.layers.27.mlp.experts.54.gate_proj", "model.layers.27.mlp.experts.55.gate_proj", "model.layers.27.mlp.experts.56.gate_proj", "model.layers.27.mlp.experts.57.gate_proj", "model.layers.27.mlp.experts.58.gate_proj", "model.layers.27.mlp.experts.59.gate_proj", "model.layers.27.mlp.experts.60.gate_proj", "model.layers.27.mlp.experts.61.gate_proj", "model.layers.27.mlp.experts.62.gate_proj", "model.layers.27.mlp.experts.63.gate_proj", "model.layers.27.mlp.experts.64.gate_proj", "model.layers.27.mlp.experts.65.gate_proj", "model.layers.27.mlp.experts.66.gate_proj", "model.layers.27.mlp.experts.67.gate_proj", "model.layers.27.mlp.experts.68.gate_proj", "model.layers.27.mlp.experts.69.gate_proj", "model.layers.27.mlp.experts.70.gate_proj", "model.layers.27.mlp.experts.71.gate_proj", "model.layers.27.mlp.experts.72.gate_proj", "model.layers.27.mlp.experts.73.gate_proj", "model.layers.27.mlp.experts.74.gate_proj", "model.layers.27.mlp.experts.75.gate_proj", "model.layers.27.mlp.experts.76.gate_proj", "model.layers.27.mlp.experts.77.gate_proj", "model.layers.27.mlp.experts.78.gate_proj", "model.layers.27.mlp.experts.79.gate_proj", "model.layers.27.mlp.experts.80.gate_proj", "model.layers.27.mlp.experts.81.gate_proj", "model.layers.27.mlp.experts.82.gate_proj", "model.layers.27.mlp.experts.83.gate_proj", "model.layers.27.mlp.experts.84.gate_proj", "model.layers.27.mlp.experts.85.gate_proj", "model.layers.27.mlp.experts.86.gate_proj", "model.layers.27.mlp.experts.87.gate_proj", "model.layers.27.mlp.experts.88.gate_proj", "model.layers.27.mlp.experts.89.gate_proj", "model.layers.27.mlp.experts.90.gate_proj", "model.layers.27.mlp.experts.91.gate_proj", "model.layers.27.mlp.experts.92.gate_proj", "model.layers.27.mlp.experts.93.gate_proj", "model.layers.27.mlp.experts.94.gate_proj", "model.layers.27.mlp.experts.95.gate_proj", "model.layers.27.mlp.experts.96.gate_proj", "model.layers.27.mlp.experts.97.gate_proj", "model.layers.27.mlp.experts.98.gate_proj", "model.layers.27.mlp.experts.99.gate_proj", "model.layers.27.mlp.experts.100.gate_proj", "model.layers.27.mlp.experts.101.gate_proj", "model.layers.27.mlp.experts.102.gate_proj", "model.layers.27.mlp.experts.103.gate_proj", "model.layers.27.mlp.experts.104.gate_proj", "model.layers.27.mlp.experts.105.gate_proj", "model.layers.27.mlp.experts.106.gate_proj", "model.layers.27.mlp.experts.107.gate_proj", "model.layers.27.mlp.experts.108.gate_proj", "model.layers.27.mlp.experts.109.gate_proj", "model.layers.27.mlp.experts.110.gate_proj", "model.layers.27.mlp.experts.111.gate_proj", "model.layers.27.mlp.experts.112.gate_proj", "model.layers.27.mlp.experts.113.gate_proj", "model.layers.27.mlp.experts.114.gate_proj", "model.layers.27.mlp.experts.115.gate_proj", "model.layers.27.mlp.experts.116.gate_proj", "model.layers.27.mlp.experts.117.gate_proj", "model.layers.27.mlp.experts.118.gate_proj", "model.layers.27.mlp.experts.119.gate_proj", "model.layers.27.mlp.experts.120.gate_proj", "model.layers.27.mlp.experts.121.gate_proj", "model.layers.27.mlp.experts.122.gate_proj", "model.layers.27.mlp.experts.123.gate_proj", "model.layers.27.mlp.experts.124.gate_proj", "model.layers.27.mlp.experts.125.gate_proj", "model.layers.27.mlp.experts.126.gate_proj", "model.layers.27.mlp.experts.127.gate_proj", "model.layers.27.mlp.experts.128.gate_proj", "model.layers.27.mlp.experts.129.gate_proj", "model.layers.27.mlp.experts.130.gate_proj", "model.layers.27.mlp.experts.131.gate_proj", "model.layers.27.mlp.experts.132.gate_proj", "model.layers.27.mlp.experts.133.gate_proj", "model.layers.27.mlp.experts.134.gate_proj", "model.layers.27.mlp.experts.135.gate_proj", "model.layers.27.mlp.experts.136.gate_proj", "model.layers.27.mlp.experts.137.gate_proj", "model.layers.27.mlp.experts.138.gate_proj", "model.layers.27.mlp.experts.139.gate_proj", "model.layers.27.mlp.experts.140.gate_proj", "model.layers.27.mlp.experts.141.gate_proj", "model.layers.27.mlp.experts.142.gate_proj", "model.layers.27.mlp.experts.143.gate_proj", "model.layers.27.mlp.experts.144.gate_proj", "model.layers.27.mlp.experts.145.gate_proj", "model.layers.27.mlp.experts.146.gate_proj", "model.layers.27.mlp.experts.147.gate_proj", "model.layers.27.mlp.experts.148.gate_proj", "model.layers.27.mlp.experts.149.gate_proj", "model.layers.27.mlp.experts.150.gate_proj", "model.layers.27.mlp.experts.151.gate_proj", "model.layers.27.mlp.experts.152.gate_proj", "model.layers.27.mlp.experts.153.gate_proj", "model.layers.27.mlp.experts.154.gate_proj", "model.layers.27.mlp.experts.155.gate_proj", "model.layers.27.mlp.experts.156.gate_proj", "model.layers.27.mlp.experts.157.gate_proj", "model.layers.27.mlp.experts.158.gate_proj", "model.layers.27.mlp.experts.159.gate_proj", "model.layers.27.mlp.experts.0.up_proj", "model.layers.27.mlp.experts.1.up_proj", "model.layers.27.mlp.experts.2.up_proj", "model.layers.27.mlp.experts.3.up_proj", "model.layers.27.mlp.experts.4.up_proj", "model.layers.27.mlp.experts.5.up_proj", "model.layers.27.mlp.experts.6.up_proj", "model.layers.27.mlp.experts.7.up_proj", "model.layers.27.mlp.experts.8.up_proj", "model.layers.27.mlp.experts.9.up_proj", "model.layers.27.mlp.experts.10.up_proj", "model.layers.27.mlp.experts.11.up_proj", "model.layers.27.mlp.experts.12.up_proj", "model.layers.27.mlp.experts.13.up_proj", "model.layers.27.mlp.experts.14.up_proj", "model.layers.27.mlp.experts.15.up_proj", "model.layers.27.mlp.experts.16.up_proj", "model.layers.27.mlp.experts.17.up_proj", "model.layers.27.mlp.experts.18.up_proj", "model.layers.27.mlp.experts.19.up_proj", "model.layers.27.mlp.experts.20.up_proj", "model.layers.27.mlp.experts.21.up_proj", "model.layers.27.mlp.experts.22.up_proj", "model.layers.27.mlp.experts.23.up_proj", "model.layers.27.mlp.experts.24.up_proj", "model.layers.27.mlp.experts.25.up_proj", "model.layers.27.mlp.experts.26.up_proj", "model.layers.27.mlp.experts.27.up_proj", "model.layers.27.mlp.experts.28.up_proj", "model.layers.27.mlp.experts.29.up_proj", "model.layers.27.mlp.experts.30.up_proj", "model.layers.27.mlp.experts.31.up_proj", "model.layers.27.mlp.experts.32.up_proj", "model.layers.27.mlp.experts.33.up_proj", "model.layers.27.mlp.experts.34.up_proj", "model.layers.27.mlp.experts.35.up_proj", "model.layers.27.mlp.experts.36.up_proj", "model.layers.27.mlp.experts.37.up_proj", "model.layers.27.mlp.experts.38.up_proj", "model.layers.27.mlp.experts.39.up_proj", "model.layers.27.mlp.experts.40.up_proj", "model.layers.27.mlp.experts.41.up_proj", "model.layers.27.mlp.experts.42.up_proj", "model.layers.27.mlp.experts.43.up_proj", "model.layers.27.mlp.experts.44.up_proj", "model.layers.27.mlp.experts.45.up_proj", "model.layers.27.mlp.experts.46.up_proj", "model.layers.27.mlp.experts.47.up_proj", "model.layers.27.mlp.experts.48.up_proj", "model.layers.27.mlp.experts.49.up_proj", "model.layers.27.mlp.experts.50.up_proj", "model.layers.27.mlp.experts.51.up_proj", "model.layers.27.mlp.experts.52.up_proj", "model.layers.27.mlp.experts.53.up_proj", "model.layers.27.mlp.experts.54.up_proj", "model.layers.27.mlp.experts.55.up_proj", "model.layers.27.mlp.experts.56.up_proj", "model.layers.27.mlp.experts.57.up_proj", "model.layers.27.mlp.experts.58.up_proj", "model.layers.27.mlp.experts.59.up_proj", "model.layers.27.mlp.experts.60.up_proj", "model.layers.27.mlp.experts.61.up_proj", "model.layers.27.mlp.experts.62.up_proj", "model.layers.27.mlp.experts.63.up_proj", "model.layers.27.mlp.experts.64.up_proj", "model.layers.27.mlp.experts.65.up_proj", "model.layers.27.mlp.experts.66.up_proj", "model.layers.27.mlp.experts.67.up_proj", "model.layers.27.mlp.experts.68.up_proj", "model.layers.27.mlp.experts.69.up_proj", "model.layers.27.mlp.experts.70.up_proj", "model.layers.27.mlp.experts.71.up_proj", "model.layers.27.mlp.experts.72.up_proj", "model.layers.27.mlp.experts.73.up_proj", "model.layers.27.mlp.experts.74.up_proj", "model.layers.27.mlp.experts.75.up_proj", "model.layers.27.mlp.experts.76.up_proj", "model.layers.27.mlp.experts.77.up_proj", "model.layers.27.mlp.experts.78.up_proj", "model.layers.27.mlp.experts.79.up_proj", "model.layers.27.mlp.experts.80.up_proj", "model.layers.27.mlp.experts.81.up_proj", "model.layers.27.mlp.experts.82.up_proj", "model.layers.27.mlp.experts.83.up_proj", "model.layers.27.mlp.experts.84.up_proj", "model.layers.27.mlp.experts.85.up_proj", "model.layers.27.mlp.experts.86.up_proj", "model.layers.27.mlp.experts.87.up_proj", "model.layers.27.mlp.experts.88.up_proj", "model.layers.27.mlp.experts.89.up_proj", "model.layers.27.mlp.experts.90.up_proj", "model.layers.27.mlp.experts.91.up_proj", "model.layers.27.mlp.experts.92.up_proj", "model.layers.27.mlp.experts.93.up_proj", "model.layers.27.mlp.experts.94.up_proj", "model.layers.27.mlp.experts.95.up_proj", "model.layers.27.mlp.experts.96.up_proj", "model.layers.27.mlp.experts.97.up_proj", "model.layers.27.mlp.experts.98.up_proj", "model.layers.27.mlp.experts.99.up_proj", "model.layers.27.mlp.experts.100.up_proj", "model.layers.27.mlp.experts.101.up_proj", "model.layers.27.mlp.experts.102.up_proj", "model.layers.27.mlp.experts.103.up_proj", "model.layers.27.mlp.experts.104.up_proj", "model.layers.27.mlp.experts.105.up_proj", "model.layers.27.mlp.experts.106.up_proj", "model.layers.27.mlp.experts.107.up_proj", "model.layers.27.mlp.experts.108.up_proj", "model.layers.27.mlp.experts.109.up_proj", "model.layers.27.mlp.experts.110.up_proj", "model.layers.27.mlp.experts.111.up_proj", "model.layers.27.mlp.experts.112.up_proj", "model.layers.27.mlp.experts.113.up_proj", "model.layers.27.mlp.experts.114.up_proj", "model.layers.27.mlp.experts.115.up_proj", "model.layers.27.mlp.experts.116.up_proj", "model.layers.27.mlp.experts.117.up_proj", "model.layers.27.mlp.experts.118.up_proj", "model.layers.27.mlp.experts.119.up_proj", "model.layers.27.mlp.experts.120.up_proj", "model.layers.27.mlp.experts.121.up_proj", "model.layers.27.mlp.experts.122.up_proj", "model.layers.27.mlp.experts.123.up_proj", "model.layers.27.mlp.experts.124.up_proj", "model.layers.27.mlp.experts.125.up_proj", "model.layers.27.mlp.experts.126.up_proj", "model.layers.27.mlp.experts.127.up_proj", "model.layers.27.mlp.experts.128.up_proj", "model.layers.27.mlp.experts.129.up_proj", "model.layers.27.mlp.experts.130.up_proj", "model.layers.27.mlp.experts.131.up_proj", "model.layers.27.mlp.experts.132.up_proj", "model.layers.27.mlp.experts.133.up_proj", "model.layers.27.mlp.experts.134.up_proj", "model.layers.27.mlp.experts.135.up_proj", "model.layers.27.mlp.experts.136.up_proj", "model.layers.27.mlp.experts.137.up_proj", "model.layers.27.mlp.experts.138.up_proj", "model.layers.27.mlp.experts.139.up_proj", "model.layers.27.mlp.experts.140.up_proj", "model.layers.27.mlp.experts.141.up_proj", "model.layers.27.mlp.experts.142.up_proj", "model.layers.27.mlp.experts.143.up_proj", "model.layers.27.mlp.experts.144.up_proj", "model.layers.27.mlp.experts.145.up_proj", "model.layers.27.mlp.experts.146.up_proj", "model.layers.27.mlp.experts.147.up_proj", "model.layers.27.mlp.experts.148.up_proj", "model.layers.27.mlp.experts.149.up_proj", "model.layers.27.mlp.experts.150.up_proj", "model.layers.27.mlp.experts.151.up_proj", "model.layers.27.mlp.experts.152.up_proj", "model.layers.27.mlp.experts.153.up_proj", "model.layers.27.mlp.experts.154.up_proj", "model.layers.27.mlp.experts.155.up_proj", "model.layers.27.mlp.experts.156.up_proj", "model.layers.27.mlp.experts.157.up_proj", "model.layers.27.mlp.experts.158.up_proj", "model.layers.27.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -8.54511745274067e-06, "dbits": 2516582400 }, { "dkld": -2.0471448078750523e-05, "dbits": 5033164800 } ] }, { "idx": 164, "layers": [ "model.layers.27.mlp.experts.0.down_proj", "model.layers.27.mlp.experts.1.down_proj", "model.layers.27.mlp.experts.2.down_proj", "model.layers.27.mlp.experts.3.down_proj", "model.layers.27.mlp.experts.4.down_proj", "model.layers.27.mlp.experts.5.down_proj", "model.layers.27.mlp.experts.6.down_proj", "model.layers.27.mlp.experts.7.down_proj", "model.layers.27.mlp.experts.8.down_proj", "model.layers.27.mlp.experts.9.down_proj", "model.layers.27.mlp.experts.10.down_proj", "model.layers.27.mlp.experts.11.down_proj", "model.layers.27.mlp.experts.12.down_proj", "model.layers.27.mlp.experts.13.down_proj", "model.layers.27.mlp.experts.14.down_proj", "model.layers.27.mlp.experts.15.down_proj", "model.layers.27.mlp.experts.16.down_proj", "model.layers.27.mlp.experts.17.down_proj", "model.layers.27.mlp.experts.18.down_proj", "model.layers.27.mlp.experts.19.down_proj", "model.layers.27.mlp.experts.20.down_proj", "model.layers.27.mlp.experts.21.down_proj", "model.layers.27.mlp.experts.22.down_proj", "model.layers.27.mlp.experts.23.down_proj", "model.layers.27.mlp.experts.24.down_proj", "model.layers.27.mlp.experts.25.down_proj", "model.layers.27.mlp.experts.26.down_proj", "model.layers.27.mlp.experts.27.down_proj", "model.layers.27.mlp.experts.28.down_proj", "model.layers.27.mlp.experts.29.down_proj", "model.layers.27.mlp.experts.30.down_proj", "model.layers.27.mlp.experts.31.down_proj", "model.layers.27.mlp.experts.32.down_proj", "model.layers.27.mlp.experts.33.down_proj", "model.layers.27.mlp.experts.34.down_proj", "model.layers.27.mlp.experts.35.down_proj", "model.layers.27.mlp.experts.36.down_proj", "model.layers.27.mlp.experts.37.down_proj", "model.layers.27.mlp.experts.38.down_proj", "model.layers.27.mlp.experts.39.down_proj", "model.layers.27.mlp.experts.40.down_proj", "model.layers.27.mlp.experts.41.down_proj", "model.layers.27.mlp.experts.42.down_proj", "model.layers.27.mlp.experts.43.down_proj", "model.layers.27.mlp.experts.44.down_proj", "model.layers.27.mlp.experts.45.down_proj", "model.layers.27.mlp.experts.46.down_proj", "model.layers.27.mlp.experts.47.down_proj", "model.layers.27.mlp.experts.48.down_proj", "model.layers.27.mlp.experts.49.down_proj", "model.layers.27.mlp.experts.50.down_proj", "model.layers.27.mlp.experts.51.down_proj", "model.layers.27.mlp.experts.52.down_proj", "model.layers.27.mlp.experts.53.down_proj", "model.layers.27.mlp.experts.54.down_proj", "model.layers.27.mlp.experts.55.down_proj", "model.layers.27.mlp.experts.56.down_proj", "model.layers.27.mlp.experts.57.down_proj", "model.layers.27.mlp.experts.58.down_proj", "model.layers.27.mlp.experts.59.down_proj", "model.layers.27.mlp.experts.60.down_proj", "model.layers.27.mlp.experts.61.down_proj", "model.layers.27.mlp.experts.62.down_proj", "model.layers.27.mlp.experts.63.down_proj", "model.layers.27.mlp.experts.64.down_proj", "model.layers.27.mlp.experts.65.down_proj", "model.layers.27.mlp.experts.66.down_proj", "model.layers.27.mlp.experts.67.down_proj", "model.layers.27.mlp.experts.68.down_proj", "model.layers.27.mlp.experts.69.down_proj", "model.layers.27.mlp.experts.70.down_proj", "model.layers.27.mlp.experts.71.down_proj", "model.layers.27.mlp.experts.72.down_proj", "model.layers.27.mlp.experts.73.down_proj", "model.layers.27.mlp.experts.74.down_proj", "model.layers.27.mlp.experts.75.down_proj", "model.layers.27.mlp.experts.76.down_proj", "model.layers.27.mlp.experts.77.down_proj", "model.layers.27.mlp.experts.78.down_proj", "model.layers.27.mlp.experts.79.down_proj", "model.layers.27.mlp.experts.80.down_proj", "model.layers.27.mlp.experts.81.down_proj", "model.layers.27.mlp.experts.82.down_proj", "model.layers.27.mlp.experts.83.down_proj", "model.layers.27.mlp.experts.84.down_proj", "model.layers.27.mlp.experts.85.down_proj", "model.layers.27.mlp.experts.86.down_proj", "model.layers.27.mlp.experts.87.down_proj", "model.layers.27.mlp.experts.88.down_proj", "model.layers.27.mlp.experts.89.down_proj", "model.layers.27.mlp.experts.90.down_proj", "model.layers.27.mlp.experts.91.down_proj", "model.layers.27.mlp.experts.92.down_proj", "model.layers.27.mlp.experts.93.down_proj", "model.layers.27.mlp.experts.94.down_proj", "model.layers.27.mlp.experts.95.down_proj", "model.layers.27.mlp.experts.96.down_proj", "model.layers.27.mlp.experts.97.down_proj", "model.layers.27.mlp.experts.98.down_proj", "model.layers.27.mlp.experts.99.down_proj", "model.layers.27.mlp.experts.100.down_proj", "model.layers.27.mlp.experts.101.down_proj", "model.layers.27.mlp.experts.102.down_proj", "model.layers.27.mlp.experts.103.down_proj", "model.layers.27.mlp.experts.104.down_proj", "model.layers.27.mlp.experts.105.down_proj", "model.layers.27.mlp.experts.106.down_proj", "model.layers.27.mlp.experts.107.down_proj", "model.layers.27.mlp.experts.108.down_proj", "model.layers.27.mlp.experts.109.down_proj", "model.layers.27.mlp.experts.110.down_proj", "model.layers.27.mlp.experts.111.down_proj", "model.layers.27.mlp.experts.112.down_proj", "model.layers.27.mlp.experts.113.down_proj", "model.layers.27.mlp.experts.114.down_proj", "model.layers.27.mlp.experts.115.down_proj", "model.layers.27.mlp.experts.116.down_proj", "model.layers.27.mlp.experts.117.down_proj", "model.layers.27.mlp.experts.118.down_proj", "model.layers.27.mlp.experts.119.down_proj", "model.layers.27.mlp.experts.120.down_proj", "model.layers.27.mlp.experts.121.down_proj", "model.layers.27.mlp.experts.122.down_proj", "model.layers.27.mlp.experts.123.down_proj", "model.layers.27.mlp.experts.124.down_proj", "model.layers.27.mlp.experts.125.down_proj", "model.layers.27.mlp.experts.126.down_proj", "model.layers.27.mlp.experts.127.down_proj", "model.layers.27.mlp.experts.128.down_proj", "model.layers.27.mlp.experts.129.down_proj", "model.layers.27.mlp.experts.130.down_proj", "model.layers.27.mlp.experts.131.down_proj", "model.layers.27.mlp.experts.132.down_proj", "model.layers.27.mlp.experts.133.down_proj", "model.layers.27.mlp.experts.134.down_proj", "model.layers.27.mlp.experts.135.down_proj", "model.layers.27.mlp.experts.136.down_proj", "model.layers.27.mlp.experts.137.down_proj", "model.layers.27.mlp.experts.138.down_proj", "model.layers.27.mlp.experts.139.down_proj", "model.layers.27.mlp.experts.140.down_proj", "model.layers.27.mlp.experts.141.down_proj", "model.layers.27.mlp.experts.142.down_proj", "model.layers.27.mlp.experts.143.down_proj", "model.layers.27.mlp.experts.144.down_proj", "model.layers.27.mlp.experts.145.down_proj", "model.layers.27.mlp.experts.146.down_proj", "model.layers.27.mlp.experts.147.down_proj", "model.layers.27.mlp.experts.148.down_proj", "model.layers.27.mlp.experts.149.down_proj", "model.layers.27.mlp.experts.150.down_proj", "model.layers.27.mlp.experts.151.down_proj", "model.layers.27.mlp.experts.152.down_proj", "model.layers.27.mlp.experts.153.down_proj", "model.layers.27.mlp.experts.154.down_proj", "model.layers.27.mlp.experts.155.down_proj", "model.layers.27.mlp.experts.156.down_proj", "model.layers.27.mlp.experts.157.down_proj", "model.layers.27.mlp.experts.158.down_proj", "model.layers.27.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.7075020372867584e-05, "dbits": 1258291200 }, { "dkld": -5.7994667440651806e-05, "dbits": 2516582400 } ] }, { "idx": 165, "layers": [ "model.layers.28.self_attn.q_proj" ], "candidates": [ { "dkld": -4.551615566015209e-05, "dbits": 62914560 }, { "dkld": -4.206113517284289e-05, "dbits": 125829120 } ] }, { "idx": 166, "layers": [ "model.layers.28.self_attn.k_proj", "model.layers.28.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0001665099523961537, "dbits": 10485760 }, { "dkld": -0.00017738807946443558, "dbits": 20971520 } ] }, { "idx": 167, "layers": [ "model.layers.28.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00010382721666246653, "dbits": 62914560 }, { "dkld": -0.00011047790758311749, "dbits": 125829120 } ] }, { "idx": 168, "layers": [ "model.layers.28.mlp.shared_experts.gate_proj", "model.layers.28.mlp.shared_experts.up_proj", "model.layers.28.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.0659604817618452e-06, "dbits": 23592960 }, { "dkld": -0.00013764582108706166, "dbits": 47185920 } ] }, { "idx": 169, "layers": [ "model.layers.28.mlp.experts.0.gate_proj", "model.layers.28.mlp.experts.1.gate_proj", "model.layers.28.mlp.experts.2.gate_proj", "model.layers.28.mlp.experts.3.gate_proj", "model.layers.28.mlp.experts.4.gate_proj", "model.layers.28.mlp.experts.5.gate_proj", "model.layers.28.mlp.experts.6.gate_proj", "model.layers.28.mlp.experts.7.gate_proj", "model.layers.28.mlp.experts.8.gate_proj", "model.layers.28.mlp.experts.9.gate_proj", "model.layers.28.mlp.experts.10.gate_proj", "model.layers.28.mlp.experts.11.gate_proj", "model.layers.28.mlp.experts.12.gate_proj", "model.layers.28.mlp.experts.13.gate_proj", "model.layers.28.mlp.experts.14.gate_proj", "model.layers.28.mlp.experts.15.gate_proj", "model.layers.28.mlp.experts.16.gate_proj", "model.layers.28.mlp.experts.17.gate_proj", "model.layers.28.mlp.experts.18.gate_proj", "model.layers.28.mlp.experts.19.gate_proj", "model.layers.28.mlp.experts.20.gate_proj", "model.layers.28.mlp.experts.21.gate_proj", "model.layers.28.mlp.experts.22.gate_proj", "model.layers.28.mlp.experts.23.gate_proj", "model.layers.28.mlp.experts.24.gate_proj", "model.layers.28.mlp.experts.25.gate_proj", "model.layers.28.mlp.experts.26.gate_proj", "model.layers.28.mlp.experts.27.gate_proj", "model.layers.28.mlp.experts.28.gate_proj", "model.layers.28.mlp.experts.29.gate_proj", "model.layers.28.mlp.experts.30.gate_proj", "model.layers.28.mlp.experts.31.gate_proj", "model.layers.28.mlp.experts.32.gate_proj", "model.layers.28.mlp.experts.33.gate_proj", "model.layers.28.mlp.experts.34.gate_proj", "model.layers.28.mlp.experts.35.gate_proj", "model.layers.28.mlp.experts.36.gate_proj", "model.layers.28.mlp.experts.37.gate_proj", "model.layers.28.mlp.experts.38.gate_proj", "model.layers.28.mlp.experts.39.gate_proj", "model.layers.28.mlp.experts.40.gate_proj", "model.layers.28.mlp.experts.41.gate_proj", "model.layers.28.mlp.experts.42.gate_proj", "model.layers.28.mlp.experts.43.gate_proj", "model.layers.28.mlp.experts.44.gate_proj", "model.layers.28.mlp.experts.45.gate_proj", "model.layers.28.mlp.experts.46.gate_proj", "model.layers.28.mlp.experts.47.gate_proj", "model.layers.28.mlp.experts.48.gate_proj", "model.layers.28.mlp.experts.49.gate_proj", "model.layers.28.mlp.experts.50.gate_proj", "model.layers.28.mlp.experts.51.gate_proj", "model.layers.28.mlp.experts.52.gate_proj", "model.layers.28.mlp.experts.53.gate_proj", "model.layers.28.mlp.experts.54.gate_proj", "model.layers.28.mlp.experts.55.gate_proj", "model.layers.28.mlp.experts.56.gate_proj", "model.layers.28.mlp.experts.57.gate_proj", "model.layers.28.mlp.experts.58.gate_proj", "model.layers.28.mlp.experts.59.gate_proj", "model.layers.28.mlp.experts.60.gate_proj", "model.layers.28.mlp.experts.61.gate_proj", "model.layers.28.mlp.experts.62.gate_proj", "model.layers.28.mlp.experts.63.gate_proj", "model.layers.28.mlp.experts.64.gate_proj", "model.layers.28.mlp.experts.65.gate_proj", "model.layers.28.mlp.experts.66.gate_proj", "model.layers.28.mlp.experts.67.gate_proj", "model.layers.28.mlp.experts.68.gate_proj", "model.layers.28.mlp.experts.69.gate_proj", "model.layers.28.mlp.experts.70.gate_proj", "model.layers.28.mlp.experts.71.gate_proj", "model.layers.28.mlp.experts.72.gate_proj", "model.layers.28.mlp.experts.73.gate_proj", "model.layers.28.mlp.experts.74.gate_proj", "model.layers.28.mlp.experts.75.gate_proj", "model.layers.28.mlp.experts.76.gate_proj", "model.layers.28.mlp.experts.77.gate_proj", "model.layers.28.mlp.experts.78.gate_proj", "model.layers.28.mlp.experts.79.gate_proj", "model.layers.28.mlp.experts.80.gate_proj", "model.layers.28.mlp.experts.81.gate_proj", "model.layers.28.mlp.experts.82.gate_proj", "model.layers.28.mlp.experts.83.gate_proj", "model.layers.28.mlp.experts.84.gate_proj", "model.layers.28.mlp.experts.85.gate_proj", "model.layers.28.mlp.experts.86.gate_proj", "model.layers.28.mlp.experts.87.gate_proj", "model.layers.28.mlp.experts.88.gate_proj", "model.layers.28.mlp.experts.89.gate_proj", "model.layers.28.mlp.experts.90.gate_proj", "model.layers.28.mlp.experts.91.gate_proj", "model.layers.28.mlp.experts.92.gate_proj", "model.layers.28.mlp.experts.93.gate_proj", "model.layers.28.mlp.experts.94.gate_proj", "model.layers.28.mlp.experts.95.gate_proj", "model.layers.28.mlp.experts.96.gate_proj", "model.layers.28.mlp.experts.97.gate_proj", "model.layers.28.mlp.experts.98.gate_proj", "model.layers.28.mlp.experts.99.gate_proj", "model.layers.28.mlp.experts.100.gate_proj", "model.layers.28.mlp.experts.101.gate_proj", "model.layers.28.mlp.experts.102.gate_proj", "model.layers.28.mlp.experts.103.gate_proj", "model.layers.28.mlp.experts.104.gate_proj", "model.layers.28.mlp.experts.105.gate_proj", "model.layers.28.mlp.experts.106.gate_proj", "model.layers.28.mlp.experts.107.gate_proj", "model.layers.28.mlp.experts.108.gate_proj", "model.layers.28.mlp.experts.109.gate_proj", "model.layers.28.mlp.experts.110.gate_proj", "model.layers.28.mlp.experts.111.gate_proj", "model.layers.28.mlp.experts.112.gate_proj", "model.layers.28.mlp.experts.113.gate_proj", "model.layers.28.mlp.experts.114.gate_proj", "model.layers.28.mlp.experts.115.gate_proj", "model.layers.28.mlp.experts.116.gate_proj", "model.layers.28.mlp.experts.117.gate_proj", "model.layers.28.mlp.experts.118.gate_proj", "model.layers.28.mlp.experts.119.gate_proj", "model.layers.28.mlp.experts.120.gate_proj", "model.layers.28.mlp.experts.121.gate_proj", "model.layers.28.mlp.experts.122.gate_proj", "model.layers.28.mlp.experts.123.gate_proj", "model.layers.28.mlp.experts.124.gate_proj", "model.layers.28.mlp.experts.125.gate_proj", "model.layers.28.mlp.experts.126.gate_proj", "model.layers.28.mlp.experts.127.gate_proj", "model.layers.28.mlp.experts.128.gate_proj", "model.layers.28.mlp.experts.129.gate_proj", "model.layers.28.mlp.experts.130.gate_proj", "model.layers.28.mlp.experts.131.gate_proj", "model.layers.28.mlp.experts.132.gate_proj", "model.layers.28.mlp.experts.133.gate_proj", "model.layers.28.mlp.experts.134.gate_proj", "model.layers.28.mlp.experts.135.gate_proj", "model.layers.28.mlp.experts.136.gate_proj", "model.layers.28.mlp.experts.137.gate_proj", "model.layers.28.mlp.experts.138.gate_proj", "model.layers.28.mlp.experts.139.gate_proj", "model.layers.28.mlp.experts.140.gate_proj", "model.layers.28.mlp.experts.141.gate_proj", "model.layers.28.mlp.experts.142.gate_proj", "model.layers.28.mlp.experts.143.gate_proj", "model.layers.28.mlp.experts.144.gate_proj", "model.layers.28.mlp.experts.145.gate_proj", "model.layers.28.mlp.experts.146.gate_proj", "model.layers.28.mlp.experts.147.gate_proj", "model.layers.28.mlp.experts.148.gate_proj", "model.layers.28.mlp.experts.149.gate_proj", "model.layers.28.mlp.experts.150.gate_proj", "model.layers.28.mlp.experts.151.gate_proj", "model.layers.28.mlp.experts.152.gate_proj", "model.layers.28.mlp.experts.153.gate_proj", "model.layers.28.mlp.experts.154.gate_proj", "model.layers.28.mlp.experts.155.gate_proj", "model.layers.28.mlp.experts.156.gate_proj", "model.layers.28.mlp.experts.157.gate_proj", "model.layers.28.mlp.experts.158.gate_proj", "model.layers.28.mlp.experts.159.gate_proj", "model.layers.28.mlp.experts.0.up_proj", "model.layers.28.mlp.experts.1.up_proj", "model.layers.28.mlp.experts.2.up_proj", "model.layers.28.mlp.experts.3.up_proj", "model.layers.28.mlp.experts.4.up_proj", "model.layers.28.mlp.experts.5.up_proj", "model.layers.28.mlp.experts.6.up_proj", "model.layers.28.mlp.experts.7.up_proj", "model.layers.28.mlp.experts.8.up_proj", "model.layers.28.mlp.experts.9.up_proj", "model.layers.28.mlp.experts.10.up_proj", "model.layers.28.mlp.experts.11.up_proj", "model.layers.28.mlp.experts.12.up_proj", "model.layers.28.mlp.experts.13.up_proj", "model.layers.28.mlp.experts.14.up_proj", "model.layers.28.mlp.experts.15.up_proj", "model.layers.28.mlp.experts.16.up_proj", "model.layers.28.mlp.experts.17.up_proj", "model.layers.28.mlp.experts.18.up_proj", "model.layers.28.mlp.experts.19.up_proj", "model.layers.28.mlp.experts.20.up_proj", "model.layers.28.mlp.experts.21.up_proj", "model.layers.28.mlp.experts.22.up_proj", "model.layers.28.mlp.experts.23.up_proj", "model.layers.28.mlp.experts.24.up_proj", "model.layers.28.mlp.experts.25.up_proj", "model.layers.28.mlp.experts.26.up_proj", "model.layers.28.mlp.experts.27.up_proj", "model.layers.28.mlp.experts.28.up_proj", "model.layers.28.mlp.experts.29.up_proj", "model.layers.28.mlp.experts.30.up_proj", "model.layers.28.mlp.experts.31.up_proj", "model.layers.28.mlp.experts.32.up_proj", "model.layers.28.mlp.experts.33.up_proj", "model.layers.28.mlp.experts.34.up_proj", "model.layers.28.mlp.experts.35.up_proj", "model.layers.28.mlp.experts.36.up_proj", "model.layers.28.mlp.experts.37.up_proj", "model.layers.28.mlp.experts.38.up_proj", "model.layers.28.mlp.experts.39.up_proj", "model.layers.28.mlp.experts.40.up_proj", "model.layers.28.mlp.experts.41.up_proj", "model.layers.28.mlp.experts.42.up_proj", "model.layers.28.mlp.experts.43.up_proj", "model.layers.28.mlp.experts.44.up_proj", "model.layers.28.mlp.experts.45.up_proj", "model.layers.28.mlp.experts.46.up_proj", "model.layers.28.mlp.experts.47.up_proj", "model.layers.28.mlp.experts.48.up_proj", "model.layers.28.mlp.experts.49.up_proj", "model.layers.28.mlp.experts.50.up_proj", "model.layers.28.mlp.experts.51.up_proj", "model.layers.28.mlp.experts.52.up_proj", "model.layers.28.mlp.experts.53.up_proj", "model.layers.28.mlp.experts.54.up_proj", "model.layers.28.mlp.experts.55.up_proj", "model.layers.28.mlp.experts.56.up_proj", "model.layers.28.mlp.experts.57.up_proj", "model.layers.28.mlp.experts.58.up_proj", "model.layers.28.mlp.experts.59.up_proj", "model.layers.28.mlp.experts.60.up_proj", "model.layers.28.mlp.experts.61.up_proj", "model.layers.28.mlp.experts.62.up_proj", "model.layers.28.mlp.experts.63.up_proj", "model.layers.28.mlp.experts.64.up_proj", "model.layers.28.mlp.experts.65.up_proj", "model.layers.28.mlp.experts.66.up_proj", "model.layers.28.mlp.experts.67.up_proj", "model.layers.28.mlp.experts.68.up_proj", "model.layers.28.mlp.experts.69.up_proj", "model.layers.28.mlp.experts.70.up_proj", "model.layers.28.mlp.experts.71.up_proj", "model.layers.28.mlp.experts.72.up_proj", "model.layers.28.mlp.experts.73.up_proj", "model.layers.28.mlp.experts.74.up_proj", "model.layers.28.mlp.experts.75.up_proj", "model.layers.28.mlp.experts.76.up_proj", "model.layers.28.mlp.experts.77.up_proj", "model.layers.28.mlp.experts.78.up_proj", "model.layers.28.mlp.experts.79.up_proj", "model.layers.28.mlp.experts.80.up_proj", "model.layers.28.mlp.experts.81.up_proj", "model.layers.28.mlp.experts.82.up_proj", "model.layers.28.mlp.experts.83.up_proj", "model.layers.28.mlp.experts.84.up_proj", "model.layers.28.mlp.experts.85.up_proj", "model.layers.28.mlp.experts.86.up_proj", "model.layers.28.mlp.experts.87.up_proj", "model.layers.28.mlp.experts.88.up_proj", "model.layers.28.mlp.experts.89.up_proj", "model.layers.28.mlp.experts.90.up_proj", "model.layers.28.mlp.experts.91.up_proj", "model.layers.28.mlp.experts.92.up_proj", "model.layers.28.mlp.experts.93.up_proj", "model.layers.28.mlp.experts.94.up_proj", "model.layers.28.mlp.experts.95.up_proj", "model.layers.28.mlp.experts.96.up_proj", "model.layers.28.mlp.experts.97.up_proj", "model.layers.28.mlp.experts.98.up_proj", "model.layers.28.mlp.experts.99.up_proj", "model.layers.28.mlp.experts.100.up_proj", "model.layers.28.mlp.experts.101.up_proj", "model.layers.28.mlp.experts.102.up_proj", "model.layers.28.mlp.experts.103.up_proj", "model.layers.28.mlp.experts.104.up_proj", "model.layers.28.mlp.experts.105.up_proj", "model.layers.28.mlp.experts.106.up_proj", "model.layers.28.mlp.experts.107.up_proj", "model.layers.28.mlp.experts.108.up_proj", "model.layers.28.mlp.experts.109.up_proj", "model.layers.28.mlp.experts.110.up_proj", "model.layers.28.mlp.experts.111.up_proj", "model.layers.28.mlp.experts.112.up_proj", "model.layers.28.mlp.experts.113.up_proj", "model.layers.28.mlp.experts.114.up_proj", "model.layers.28.mlp.experts.115.up_proj", "model.layers.28.mlp.experts.116.up_proj", "model.layers.28.mlp.experts.117.up_proj", "model.layers.28.mlp.experts.118.up_proj", "model.layers.28.mlp.experts.119.up_proj", "model.layers.28.mlp.experts.120.up_proj", "model.layers.28.mlp.experts.121.up_proj", "model.layers.28.mlp.experts.122.up_proj", "model.layers.28.mlp.experts.123.up_proj", "model.layers.28.mlp.experts.124.up_proj", "model.layers.28.mlp.experts.125.up_proj", "model.layers.28.mlp.experts.126.up_proj", "model.layers.28.mlp.experts.127.up_proj", "model.layers.28.mlp.experts.128.up_proj", "model.layers.28.mlp.experts.129.up_proj", "model.layers.28.mlp.experts.130.up_proj", "model.layers.28.mlp.experts.131.up_proj", "model.layers.28.mlp.experts.132.up_proj", "model.layers.28.mlp.experts.133.up_proj", "model.layers.28.mlp.experts.134.up_proj", "model.layers.28.mlp.experts.135.up_proj", "model.layers.28.mlp.experts.136.up_proj", "model.layers.28.mlp.experts.137.up_proj", "model.layers.28.mlp.experts.138.up_proj", "model.layers.28.mlp.experts.139.up_proj", "model.layers.28.mlp.experts.140.up_proj", "model.layers.28.mlp.experts.141.up_proj", "model.layers.28.mlp.experts.142.up_proj", "model.layers.28.mlp.experts.143.up_proj", "model.layers.28.mlp.experts.144.up_proj", "model.layers.28.mlp.experts.145.up_proj", "model.layers.28.mlp.experts.146.up_proj", "model.layers.28.mlp.experts.147.up_proj", "model.layers.28.mlp.experts.148.up_proj", "model.layers.28.mlp.experts.149.up_proj", "model.layers.28.mlp.experts.150.up_proj", "model.layers.28.mlp.experts.151.up_proj", "model.layers.28.mlp.experts.152.up_proj", "model.layers.28.mlp.experts.153.up_proj", "model.layers.28.mlp.experts.154.up_proj", "model.layers.28.mlp.experts.155.up_proj", "model.layers.28.mlp.experts.156.up_proj", "model.layers.28.mlp.experts.157.up_proj", "model.layers.28.mlp.experts.158.up_proj", "model.layers.28.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.650814950327378e-08, "dbits": 2516582400 }, { "dkld": -3.3814460039138794e-05, "dbits": 5033164800 } ] }, { "idx": 170, "layers": [ "model.layers.28.mlp.experts.0.down_proj", "model.layers.28.mlp.experts.1.down_proj", "model.layers.28.mlp.experts.2.down_proj", "model.layers.28.mlp.experts.3.down_proj", "model.layers.28.mlp.experts.4.down_proj", "model.layers.28.mlp.experts.5.down_proj", "model.layers.28.mlp.experts.6.down_proj", "model.layers.28.mlp.experts.7.down_proj", "model.layers.28.mlp.experts.8.down_proj", "model.layers.28.mlp.experts.9.down_proj", "model.layers.28.mlp.experts.10.down_proj", "model.layers.28.mlp.experts.11.down_proj", "model.layers.28.mlp.experts.12.down_proj", "model.layers.28.mlp.experts.13.down_proj", "model.layers.28.mlp.experts.14.down_proj", "model.layers.28.mlp.experts.15.down_proj", "model.layers.28.mlp.experts.16.down_proj", "model.layers.28.mlp.experts.17.down_proj", "model.layers.28.mlp.experts.18.down_proj", "model.layers.28.mlp.experts.19.down_proj", "model.layers.28.mlp.experts.20.down_proj", "model.layers.28.mlp.experts.21.down_proj", "model.layers.28.mlp.experts.22.down_proj", "model.layers.28.mlp.experts.23.down_proj", "model.layers.28.mlp.experts.24.down_proj", "model.layers.28.mlp.experts.25.down_proj", "model.layers.28.mlp.experts.26.down_proj", "model.layers.28.mlp.experts.27.down_proj", "model.layers.28.mlp.experts.28.down_proj", "model.layers.28.mlp.experts.29.down_proj", "model.layers.28.mlp.experts.30.down_proj", "model.layers.28.mlp.experts.31.down_proj", "model.layers.28.mlp.experts.32.down_proj", "model.layers.28.mlp.experts.33.down_proj", "model.layers.28.mlp.experts.34.down_proj", "model.layers.28.mlp.experts.35.down_proj", "model.layers.28.mlp.experts.36.down_proj", "model.layers.28.mlp.experts.37.down_proj", "model.layers.28.mlp.experts.38.down_proj", "model.layers.28.mlp.experts.39.down_proj", "model.layers.28.mlp.experts.40.down_proj", "model.layers.28.mlp.experts.41.down_proj", "model.layers.28.mlp.experts.42.down_proj", "model.layers.28.mlp.experts.43.down_proj", "model.layers.28.mlp.experts.44.down_proj", "model.layers.28.mlp.experts.45.down_proj", "model.layers.28.mlp.experts.46.down_proj", "model.layers.28.mlp.experts.47.down_proj", "model.layers.28.mlp.experts.48.down_proj", "model.layers.28.mlp.experts.49.down_proj", "model.layers.28.mlp.experts.50.down_proj", "model.layers.28.mlp.experts.51.down_proj", "model.layers.28.mlp.experts.52.down_proj", "model.layers.28.mlp.experts.53.down_proj", "model.layers.28.mlp.experts.54.down_proj", "model.layers.28.mlp.experts.55.down_proj", "model.layers.28.mlp.experts.56.down_proj", "model.layers.28.mlp.experts.57.down_proj", "model.layers.28.mlp.experts.58.down_proj", "model.layers.28.mlp.experts.59.down_proj", "model.layers.28.mlp.experts.60.down_proj", "model.layers.28.mlp.experts.61.down_proj", "model.layers.28.mlp.experts.62.down_proj", "model.layers.28.mlp.experts.63.down_proj", "model.layers.28.mlp.experts.64.down_proj", "model.layers.28.mlp.experts.65.down_proj", "model.layers.28.mlp.experts.66.down_proj", "model.layers.28.mlp.experts.67.down_proj", "model.layers.28.mlp.experts.68.down_proj", "model.layers.28.mlp.experts.69.down_proj", "model.layers.28.mlp.experts.70.down_proj", "model.layers.28.mlp.experts.71.down_proj", "model.layers.28.mlp.experts.72.down_proj", "model.layers.28.mlp.experts.73.down_proj", "model.layers.28.mlp.experts.74.down_proj", "model.layers.28.mlp.experts.75.down_proj", "model.layers.28.mlp.experts.76.down_proj", "model.layers.28.mlp.experts.77.down_proj", "model.layers.28.mlp.experts.78.down_proj", "model.layers.28.mlp.experts.79.down_proj", "model.layers.28.mlp.experts.80.down_proj", "model.layers.28.mlp.experts.81.down_proj", "model.layers.28.mlp.experts.82.down_proj", "model.layers.28.mlp.experts.83.down_proj", "model.layers.28.mlp.experts.84.down_proj", "model.layers.28.mlp.experts.85.down_proj", "model.layers.28.mlp.experts.86.down_proj", "model.layers.28.mlp.experts.87.down_proj", "model.layers.28.mlp.experts.88.down_proj", "model.layers.28.mlp.experts.89.down_proj", "model.layers.28.mlp.experts.90.down_proj", "model.layers.28.mlp.experts.91.down_proj", "model.layers.28.mlp.experts.92.down_proj", "model.layers.28.mlp.experts.93.down_proj", "model.layers.28.mlp.experts.94.down_proj", "model.layers.28.mlp.experts.95.down_proj", "model.layers.28.mlp.experts.96.down_proj", "model.layers.28.mlp.experts.97.down_proj", "model.layers.28.mlp.experts.98.down_proj", "model.layers.28.mlp.experts.99.down_proj", "model.layers.28.mlp.experts.100.down_proj", "model.layers.28.mlp.experts.101.down_proj", "model.layers.28.mlp.experts.102.down_proj", "model.layers.28.mlp.experts.103.down_proj", "model.layers.28.mlp.experts.104.down_proj", "model.layers.28.mlp.experts.105.down_proj", "model.layers.28.mlp.experts.106.down_proj", "model.layers.28.mlp.experts.107.down_proj", "model.layers.28.mlp.experts.108.down_proj", "model.layers.28.mlp.experts.109.down_proj", "model.layers.28.mlp.experts.110.down_proj", "model.layers.28.mlp.experts.111.down_proj", "model.layers.28.mlp.experts.112.down_proj", "model.layers.28.mlp.experts.113.down_proj", "model.layers.28.mlp.experts.114.down_proj", "model.layers.28.mlp.experts.115.down_proj", "model.layers.28.mlp.experts.116.down_proj", "model.layers.28.mlp.experts.117.down_proj", "model.layers.28.mlp.experts.118.down_proj", "model.layers.28.mlp.experts.119.down_proj", "model.layers.28.mlp.experts.120.down_proj", "model.layers.28.mlp.experts.121.down_proj", "model.layers.28.mlp.experts.122.down_proj", "model.layers.28.mlp.experts.123.down_proj", "model.layers.28.mlp.experts.124.down_proj", "model.layers.28.mlp.experts.125.down_proj", "model.layers.28.mlp.experts.126.down_proj", "model.layers.28.mlp.experts.127.down_proj", "model.layers.28.mlp.experts.128.down_proj", "model.layers.28.mlp.experts.129.down_proj", "model.layers.28.mlp.experts.130.down_proj", "model.layers.28.mlp.experts.131.down_proj", "model.layers.28.mlp.experts.132.down_proj", "model.layers.28.mlp.experts.133.down_proj", "model.layers.28.mlp.experts.134.down_proj", "model.layers.28.mlp.experts.135.down_proj", "model.layers.28.mlp.experts.136.down_proj", "model.layers.28.mlp.experts.137.down_proj", "model.layers.28.mlp.experts.138.down_proj", "model.layers.28.mlp.experts.139.down_proj", "model.layers.28.mlp.experts.140.down_proj", "model.layers.28.mlp.experts.141.down_proj", "model.layers.28.mlp.experts.142.down_proj", "model.layers.28.mlp.experts.143.down_proj", "model.layers.28.mlp.experts.144.down_proj", "model.layers.28.mlp.experts.145.down_proj", "model.layers.28.mlp.experts.146.down_proj", "model.layers.28.mlp.experts.147.down_proj", "model.layers.28.mlp.experts.148.down_proj", "model.layers.28.mlp.experts.149.down_proj", "model.layers.28.mlp.experts.150.down_proj", "model.layers.28.mlp.experts.151.down_proj", "model.layers.28.mlp.experts.152.down_proj", "model.layers.28.mlp.experts.153.down_proj", "model.layers.28.mlp.experts.154.down_proj", "model.layers.28.mlp.experts.155.down_proj", "model.layers.28.mlp.experts.156.down_proj", "model.layers.28.mlp.experts.157.down_proj", "model.layers.28.mlp.experts.158.down_proj", "model.layers.28.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.196723457425798e-05, "dbits": 1258291200 }, { "dkld": -3.521181643009047e-05, "dbits": 2516582400 } ] }, { "idx": 171, "layers": [ "model.layers.29.self_attn.q_proj" ], "candidates": [ { "dkld": -2.761899959295884e-05, "dbits": 62914560 }, { "dkld": -8.312007412313721e-06, "dbits": 125829120 } ] }, { "idx": 172, "layers": [ "model.layers.29.self_attn.k_proj", "model.layers.29.self_attn.v_proj" ], "candidates": [ { "dkld": 8.798406925052474e-05, "dbits": 10485760 }, { "dkld": 8.63242894411087e-06, "dbits": 20971520 } ] }, { "idx": 173, "layers": [ "model.layers.29.self_attn.o_proj" ], "candidates": [ { "dkld": -5.735158920287982e-05, "dbits": 62914560 }, { "dkld": -3.3118901774285836e-05, "dbits": 125829120 } ] }, { "idx": 174, "layers": [ "model.layers.29.mlp.shared_experts.gate_proj", "model.layers.29.mlp.shared_experts.up_proj", "model.layers.29.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.8662569820880196e-05, "dbits": 23592960 }, { "dkld": 3.525721840560471e-05, "dbits": 47185920 } ] }, { "idx": 175, "layers": [ "model.layers.29.mlp.experts.0.gate_proj", "model.layers.29.mlp.experts.1.gate_proj", "model.layers.29.mlp.experts.2.gate_proj", "model.layers.29.mlp.experts.3.gate_proj", "model.layers.29.mlp.experts.4.gate_proj", "model.layers.29.mlp.experts.5.gate_proj", "model.layers.29.mlp.experts.6.gate_proj", "model.layers.29.mlp.experts.7.gate_proj", "model.layers.29.mlp.experts.8.gate_proj", "model.layers.29.mlp.experts.9.gate_proj", "model.layers.29.mlp.experts.10.gate_proj", "model.layers.29.mlp.experts.11.gate_proj", "model.layers.29.mlp.experts.12.gate_proj", "model.layers.29.mlp.experts.13.gate_proj", "model.layers.29.mlp.experts.14.gate_proj", "model.layers.29.mlp.experts.15.gate_proj", "model.layers.29.mlp.experts.16.gate_proj", "model.layers.29.mlp.experts.17.gate_proj", "model.layers.29.mlp.experts.18.gate_proj", "model.layers.29.mlp.experts.19.gate_proj", "model.layers.29.mlp.experts.20.gate_proj", "model.layers.29.mlp.experts.21.gate_proj", "model.layers.29.mlp.experts.22.gate_proj", "model.layers.29.mlp.experts.23.gate_proj", "model.layers.29.mlp.experts.24.gate_proj", "model.layers.29.mlp.experts.25.gate_proj", "model.layers.29.mlp.experts.26.gate_proj", "model.layers.29.mlp.experts.27.gate_proj", "model.layers.29.mlp.experts.28.gate_proj", "model.layers.29.mlp.experts.29.gate_proj", "model.layers.29.mlp.experts.30.gate_proj", "model.layers.29.mlp.experts.31.gate_proj", "model.layers.29.mlp.experts.32.gate_proj", "model.layers.29.mlp.experts.33.gate_proj", "model.layers.29.mlp.experts.34.gate_proj", "model.layers.29.mlp.experts.35.gate_proj", "model.layers.29.mlp.experts.36.gate_proj", "model.layers.29.mlp.experts.37.gate_proj", "model.layers.29.mlp.experts.38.gate_proj", "model.layers.29.mlp.experts.39.gate_proj", "model.layers.29.mlp.experts.40.gate_proj", "model.layers.29.mlp.experts.41.gate_proj", "model.layers.29.mlp.experts.42.gate_proj", "model.layers.29.mlp.experts.43.gate_proj", "model.layers.29.mlp.experts.44.gate_proj", "model.layers.29.mlp.experts.45.gate_proj", "model.layers.29.mlp.experts.46.gate_proj", "model.layers.29.mlp.experts.47.gate_proj", "model.layers.29.mlp.experts.48.gate_proj", "model.layers.29.mlp.experts.49.gate_proj", "model.layers.29.mlp.experts.50.gate_proj", "model.layers.29.mlp.experts.51.gate_proj", "model.layers.29.mlp.experts.52.gate_proj", "model.layers.29.mlp.experts.53.gate_proj", "model.layers.29.mlp.experts.54.gate_proj", "model.layers.29.mlp.experts.55.gate_proj", "model.layers.29.mlp.experts.56.gate_proj", "model.layers.29.mlp.experts.57.gate_proj", "model.layers.29.mlp.experts.58.gate_proj", "model.layers.29.mlp.experts.59.gate_proj", "model.layers.29.mlp.experts.60.gate_proj", "model.layers.29.mlp.experts.61.gate_proj", "model.layers.29.mlp.experts.62.gate_proj", "model.layers.29.mlp.experts.63.gate_proj", "model.layers.29.mlp.experts.64.gate_proj", "model.layers.29.mlp.experts.65.gate_proj", "model.layers.29.mlp.experts.66.gate_proj", "model.layers.29.mlp.experts.67.gate_proj", "model.layers.29.mlp.experts.68.gate_proj", "model.layers.29.mlp.experts.69.gate_proj", "model.layers.29.mlp.experts.70.gate_proj", "model.layers.29.mlp.experts.71.gate_proj", "model.layers.29.mlp.experts.72.gate_proj", "model.layers.29.mlp.experts.73.gate_proj", "model.layers.29.mlp.experts.74.gate_proj", "model.layers.29.mlp.experts.75.gate_proj", "model.layers.29.mlp.experts.76.gate_proj", "model.layers.29.mlp.experts.77.gate_proj", "model.layers.29.mlp.experts.78.gate_proj", "model.layers.29.mlp.experts.79.gate_proj", "model.layers.29.mlp.experts.80.gate_proj", "model.layers.29.mlp.experts.81.gate_proj", "model.layers.29.mlp.experts.82.gate_proj", "model.layers.29.mlp.experts.83.gate_proj", "model.layers.29.mlp.experts.84.gate_proj", "model.layers.29.mlp.experts.85.gate_proj", "model.layers.29.mlp.experts.86.gate_proj", "model.layers.29.mlp.experts.87.gate_proj", "model.layers.29.mlp.experts.88.gate_proj", "model.layers.29.mlp.experts.89.gate_proj", "model.layers.29.mlp.experts.90.gate_proj", "model.layers.29.mlp.experts.91.gate_proj", "model.layers.29.mlp.experts.92.gate_proj", "model.layers.29.mlp.experts.93.gate_proj", "model.layers.29.mlp.experts.94.gate_proj", "model.layers.29.mlp.experts.95.gate_proj", "model.layers.29.mlp.experts.96.gate_proj", "model.layers.29.mlp.experts.97.gate_proj", "model.layers.29.mlp.experts.98.gate_proj", "model.layers.29.mlp.experts.99.gate_proj", "model.layers.29.mlp.experts.100.gate_proj", "model.layers.29.mlp.experts.101.gate_proj", "model.layers.29.mlp.experts.102.gate_proj", "model.layers.29.mlp.experts.103.gate_proj", "model.layers.29.mlp.experts.104.gate_proj", "model.layers.29.mlp.experts.105.gate_proj", "model.layers.29.mlp.experts.106.gate_proj", "model.layers.29.mlp.experts.107.gate_proj", "model.layers.29.mlp.experts.108.gate_proj", "model.layers.29.mlp.experts.109.gate_proj", "model.layers.29.mlp.experts.110.gate_proj", "model.layers.29.mlp.experts.111.gate_proj", "model.layers.29.mlp.experts.112.gate_proj", "model.layers.29.mlp.experts.113.gate_proj", "model.layers.29.mlp.experts.114.gate_proj", "model.layers.29.mlp.experts.115.gate_proj", "model.layers.29.mlp.experts.116.gate_proj", "model.layers.29.mlp.experts.117.gate_proj", "model.layers.29.mlp.experts.118.gate_proj", "model.layers.29.mlp.experts.119.gate_proj", "model.layers.29.mlp.experts.120.gate_proj", "model.layers.29.mlp.experts.121.gate_proj", "model.layers.29.mlp.experts.122.gate_proj", "model.layers.29.mlp.experts.123.gate_proj", "model.layers.29.mlp.experts.124.gate_proj", "model.layers.29.mlp.experts.125.gate_proj", "model.layers.29.mlp.experts.126.gate_proj", "model.layers.29.mlp.experts.127.gate_proj", "model.layers.29.mlp.experts.128.gate_proj", "model.layers.29.mlp.experts.129.gate_proj", "model.layers.29.mlp.experts.130.gate_proj", "model.layers.29.mlp.experts.131.gate_proj", "model.layers.29.mlp.experts.132.gate_proj", "model.layers.29.mlp.experts.133.gate_proj", "model.layers.29.mlp.experts.134.gate_proj", "model.layers.29.mlp.experts.135.gate_proj", "model.layers.29.mlp.experts.136.gate_proj", "model.layers.29.mlp.experts.137.gate_proj", "model.layers.29.mlp.experts.138.gate_proj", "model.layers.29.mlp.experts.139.gate_proj", "model.layers.29.mlp.experts.140.gate_proj", "model.layers.29.mlp.experts.141.gate_proj", "model.layers.29.mlp.experts.142.gate_proj", "model.layers.29.mlp.experts.143.gate_proj", "model.layers.29.mlp.experts.144.gate_proj", "model.layers.29.mlp.experts.145.gate_proj", "model.layers.29.mlp.experts.146.gate_proj", "model.layers.29.mlp.experts.147.gate_proj", "model.layers.29.mlp.experts.148.gate_proj", "model.layers.29.mlp.experts.149.gate_proj", "model.layers.29.mlp.experts.150.gate_proj", "model.layers.29.mlp.experts.151.gate_proj", "model.layers.29.mlp.experts.152.gate_proj", "model.layers.29.mlp.experts.153.gate_proj", "model.layers.29.mlp.experts.154.gate_proj", "model.layers.29.mlp.experts.155.gate_proj", "model.layers.29.mlp.experts.156.gate_proj", "model.layers.29.mlp.experts.157.gate_proj", "model.layers.29.mlp.experts.158.gate_proj", "model.layers.29.mlp.experts.159.gate_proj", "model.layers.29.mlp.experts.0.up_proj", "model.layers.29.mlp.experts.1.up_proj", "model.layers.29.mlp.experts.2.up_proj", "model.layers.29.mlp.experts.3.up_proj", "model.layers.29.mlp.experts.4.up_proj", "model.layers.29.mlp.experts.5.up_proj", "model.layers.29.mlp.experts.6.up_proj", "model.layers.29.mlp.experts.7.up_proj", "model.layers.29.mlp.experts.8.up_proj", "model.layers.29.mlp.experts.9.up_proj", "model.layers.29.mlp.experts.10.up_proj", "model.layers.29.mlp.experts.11.up_proj", "model.layers.29.mlp.experts.12.up_proj", "model.layers.29.mlp.experts.13.up_proj", "model.layers.29.mlp.experts.14.up_proj", "model.layers.29.mlp.experts.15.up_proj", "model.layers.29.mlp.experts.16.up_proj", "model.layers.29.mlp.experts.17.up_proj", "model.layers.29.mlp.experts.18.up_proj", "model.layers.29.mlp.experts.19.up_proj", "model.layers.29.mlp.experts.20.up_proj", "model.layers.29.mlp.experts.21.up_proj", "model.layers.29.mlp.experts.22.up_proj", "model.layers.29.mlp.experts.23.up_proj", "model.layers.29.mlp.experts.24.up_proj", "model.layers.29.mlp.experts.25.up_proj", "model.layers.29.mlp.experts.26.up_proj", "model.layers.29.mlp.experts.27.up_proj", "model.layers.29.mlp.experts.28.up_proj", "model.layers.29.mlp.experts.29.up_proj", "model.layers.29.mlp.experts.30.up_proj", "model.layers.29.mlp.experts.31.up_proj", "model.layers.29.mlp.experts.32.up_proj", "model.layers.29.mlp.experts.33.up_proj", "model.layers.29.mlp.experts.34.up_proj", "model.layers.29.mlp.experts.35.up_proj", "model.layers.29.mlp.experts.36.up_proj", "model.layers.29.mlp.experts.37.up_proj", "model.layers.29.mlp.experts.38.up_proj", "model.layers.29.mlp.experts.39.up_proj", "model.layers.29.mlp.experts.40.up_proj", "model.layers.29.mlp.experts.41.up_proj", "model.layers.29.mlp.experts.42.up_proj", "model.layers.29.mlp.experts.43.up_proj", "model.layers.29.mlp.experts.44.up_proj", "model.layers.29.mlp.experts.45.up_proj", "model.layers.29.mlp.experts.46.up_proj", "model.layers.29.mlp.experts.47.up_proj", "model.layers.29.mlp.experts.48.up_proj", "model.layers.29.mlp.experts.49.up_proj", "model.layers.29.mlp.experts.50.up_proj", "model.layers.29.mlp.experts.51.up_proj", "model.layers.29.mlp.experts.52.up_proj", "model.layers.29.mlp.experts.53.up_proj", "model.layers.29.mlp.experts.54.up_proj", "model.layers.29.mlp.experts.55.up_proj", "model.layers.29.mlp.experts.56.up_proj", "model.layers.29.mlp.experts.57.up_proj", "model.layers.29.mlp.experts.58.up_proj", "model.layers.29.mlp.experts.59.up_proj", "model.layers.29.mlp.experts.60.up_proj", "model.layers.29.mlp.experts.61.up_proj", "model.layers.29.mlp.experts.62.up_proj", "model.layers.29.mlp.experts.63.up_proj", "model.layers.29.mlp.experts.64.up_proj", "model.layers.29.mlp.experts.65.up_proj", "model.layers.29.mlp.experts.66.up_proj", "model.layers.29.mlp.experts.67.up_proj", "model.layers.29.mlp.experts.68.up_proj", "model.layers.29.mlp.experts.69.up_proj", "model.layers.29.mlp.experts.70.up_proj", "model.layers.29.mlp.experts.71.up_proj", "model.layers.29.mlp.experts.72.up_proj", "model.layers.29.mlp.experts.73.up_proj", "model.layers.29.mlp.experts.74.up_proj", "model.layers.29.mlp.experts.75.up_proj", "model.layers.29.mlp.experts.76.up_proj", "model.layers.29.mlp.experts.77.up_proj", "model.layers.29.mlp.experts.78.up_proj", "model.layers.29.mlp.experts.79.up_proj", "model.layers.29.mlp.experts.80.up_proj", "model.layers.29.mlp.experts.81.up_proj", "model.layers.29.mlp.experts.82.up_proj", "model.layers.29.mlp.experts.83.up_proj", "model.layers.29.mlp.experts.84.up_proj", "model.layers.29.mlp.experts.85.up_proj", "model.layers.29.mlp.experts.86.up_proj", "model.layers.29.mlp.experts.87.up_proj", "model.layers.29.mlp.experts.88.up_proj", "model.layers.29.mlp.experts.89.up_proj", "model.layers.29.mlp.experts.90.up_proj", "model.layers.29.mlp.experts.91.up_proj", "model.layers.29.mlp.experts.92.up_proj", "model.layers.29.mlp.experts.93.up_proj", "model.layers.29.mlp.experts.94.up_proj", "model.layers.29.mlp.experts.95.up_proj", "model.layers.29.mlp.experts.96.up_proj", "model.layers.29.mlp.experts.97.up_proj", "model.layers.29.mlp.experts.98.up_proj", "model.layers.29.mlp.experts.99.up_proj", "model.layers.29.mlp.experts.100.up_proj", "model.layers.29.mlp.experts.101.up_proj", "model.layers.29.mlp.experts.102.up_proj", "model.layers.29.mlp.experts.103.up_proj", "model.layers.29.mlp.experts.104.up_proj", "model.layers.29.mlp.experts.105.up_proj", "model.layers.29.mlp.experts.106.up_proj", "model.layers.29.mlp.experts.107.up_proj", "model.layers.29.mlp.experts.108.up_proj", "model.layers.29.mlp.experts.109.up_proj", "model.layers.29.mlp.experts.110.up_proj", "model.layers.29.mlp.experts.111.up_proj", "model.layers.29.mlp.experts.112.up_proj", "model.layers.29.mlp.experts.113.up_proj", "model.layers.29.mlp.experts.114.up_proj", "model.layers.29.mlp.experts.115.up_proj", "model.layers.29.mlp.experts.116.up_proj", "model.layers.29.mlp.experts.117.up_proj", "model.layers.29.mlp.experts.118.up_proj", "model.layers.29.mlp.experts.119.up_proj", "model.layers.29.mlp.experts.120.up_proj", "model.layers.29.mlp.experts.121.up_proj", "model.layers.29.mlp.experts.122.up_proj", "model.layers.29.mlp.experts.123.up_proj", "model.layers.29.mlp.experts.124.up_proj", "model.layers.29.mlp.experts.125.up_proj", "model.layers.29.mlp.experts.126.up_proj", "model.layers.29.mlp.experts.127.up_proj", "model.layers.29.mlp.experts.128.up_proj", "model.layers.29.mlp.experts.129.up_proj", "model.layers.29.mlp.experts.130.up_proj", "model.layers.29.mlp.experts.131.up_proj", "model.layers.29.mlp.experts.132.up_proj", "model.layers.29.mlp.experts.133.up_proj", "model.layers.29.mlp.experts.134.up_proj", "model.layers.29.mlp.experts.135.up_proj", "model.layers.29.mlp.experts.136.up_proj", "model.layers.29.mlp.experts.137.up_proj", "model.layers.29.mlp.experts.138.up_proj", "model.layers.29.mlp.experts.139.up_proj", "model.layers.29.mlp.experts.140.up_proj", "model.layers.29.mlp.experts.141.up_proj", "model.layers.29.mlp.experts.142.up_proj", "model.layers.29.mlp.experts.143.up_proj", "model.layers.29.mlp.experts.144.up_proj", "model.layers.29.mlp.experts.145.up_proj", "model.layers.29.mlp.experts.146.up_proj", "model.layers.29.mlp.experts.147.up_proj", "model.layers.29.mlp.experts.148.up_proj", "model.layers.29.mlp.experts.149.up_proj", "model.layers.29.mlp.experts.150.up_proj", "model.layers.29.mlp.experts.151.up_proj", "model.layers.29.mlp.experts.152.up_proj", "model.layers.29.mlp.experts.153.up_proj", "model.layers.29.mlp.experts.154.up_proj", "model.layers.29.mlp.experts.155.up_proj", "model.layers.29.mlp.experts.156.up_proj", "model.layers.29.mlp.experts.157.up_proj", "model.layers.29.mlp.experts.158.up_proj", "model.layers.29.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.9633909687389456e-06, "dbits": 2516582400 }, { "dkld": -3.9496971294282826e-05, "dbits": 5033164800 } ] }, { "idx": 176, "layers": [ "model.layers.29.mlp.experts.0.down_proj", "model.layers.29.mlp.experts.1.down_proj", "model.layers.29.mlp.experts.2.down_proj", "model.layers.29.mlp.experts.3.down_proj", "model.layers.29.mlp.experts.4.down_proj", "model.layers.29.mlp.experts.5.down_proj", "model.layers.29.mlp.experts.6.down_proj", "model.layers.29.mlp.experts.7.down_proj", "model.layers.29.mlp.experts.8.down_proj", "model.layers.29.mlp.experts.9.down_proj", "model.layers.29.mlp.experts.10.down_proj", "model.layers.29.mlp.experts.11.down_proj", "model.layers.29.mlp.experts.12.down_proj", "model.layers.29.mlp.experts.13.down_proj", "model.layers.29.mlp.experts.14.down_proj", "model.layers.29.mlp.experts.15.down_proj", "model.layers.29.mlp.experts.16.down_proj", "model.layers.29.mlp.experts.17.down_proj", "model.layers.29.mlp.experts.18.down_proj", "model.layers.29.mlp.experts.19.down_proj", "model.layers.29.mlp.experts.20.down_proj", "model.layers.29.mlp.experts.21.down_proj", "model.layers.29.mlp.experts.22.down_proj", "model.layers.29.mlp.experts.23.down_proj", "model.layers.29.mlp.experts.24.down_proj", "model.layers.29.mlp.experts.25.down_proj", "model.layers.29.mlp.experts.26.down_proj", "model.layers.29.mlp.experts.27.down_proj", "model.layers.29.mlp.experts.28.down_proj", "model.layers.29.mlp.experts.29.down_proj", "model.layers.29.mlp.experts.30.down_proj", "model.layers.29.mlp.experts.31.down_proj", "model.layers.29.mlp.experts.32.down_proj", "model.layers.29.mlp.experts.33.down_proj", "model.layers.29.mlp.experts.34.down_proj", "model.layers.29.mlp.experts.35.down_proj", "model.layers.29.mlp.experts.36.down_proj", "model.layers.29.mlp.experts.37.down_proj", "model.layers.29.mlp.experts.38.down_proj", "model.layers.29.mlp.experts.39.down_proj", "model.layers.29.mlp.experts.40.down_proj", "model.layers.29.mlp.experts.41.down_proj", "model.layers.29.mlp.experts.42.down_proj", "model.layers.29.mlp.experts.43.down_proj", "model.layers.29.mlp.experts.44.down_proj", "model.layers.29.mlp.experts.45.down_proj", "model.layers.29.mlp.experts.46.down_proj", "model.layers.29.mlp.experts.47.down_proj", "model.layers.29.mlp.experts.48.down_proj", "model.layers.29.mlp.experts.49.down_proj", "model.layers.29.mlp.experts.50.down_proj", "model.layers.29.mlp.experts.51.down_proj", "model.layers.29.mlp.experts.52.down_proj", "model.layers.29.mlp.experts.53.down_proj", "model.layers.29.mlp.experts.54.down_proj", "model.layers.29.mlp.experts.55.down_proj", "model.layers.29.mlp.experts.56.down_proj", "model.layers.29.mlp.experts.57.down_proj", "model.layers.29.mlp.experts.58.down_proj", "model.layers.29.mlp.experts.59.down_proj", "model.layers.29.mlp.experts.60.down_proj", "model.layers.29.mlp.experts.61.down_proj", "model.layers.29.mlp.experts.62.down_proj", "model.layers.29.mlp.experts.63.down_proj", "model.layers.29.mlp.experts.64.down_proj", "model.layers.29.mlp.experts.65.down_proj", "model.layers.29.mlp.experts.66.down_proj", "model.layers.29.mlp.experts.67.down_proj", "model.layers.29.mlp.experts.68.down_proj", "model.layers.29.mlp.experts.69.down_proj", "model.layers.29.mlp.experts.70.down_proj", "model.layers.29.mlp.experts.71.down_proj", "model.layers.29.mlp.experts.72.down_proj", "model.layers.29.mlp.experts.73.down_proj", "model.layers.29.mlp.experts.74.down_proj", "model.layers.29.mlp.experts.75.down_proj", "model.layers.29.mlp.experts.76.down_proj", "model.layers.29.mlp.experts.77.down_proj", "model.layers.29.mlp.experts.78.down_proj", "model.layers.29.mlp.experts.79.down_proj", "model.layers.29.mlp.experts.80.down_proj", "model.layers.29.mlp.experts.81.down_proj", "model.layers.29.mlp.experts.82.down_proj", "model.layers.29.mlp.experts.83.down_proj", "model.layers.29.mlp.experts.84.down_proj", "model.layers.29.mlp.experts.85.down_proj", "model.layers.29.mlp.experts.86.down_proj", "model.layers.29.mlp.experts.87.down_proj", "model.layers.29.mlp.experts.88.down_proj", "model.layers.29.mlp.experts.89.down_proj", "model.layers.29.mlp.experts.90.down_proj", "model.layers.29.mlp.experts.91.down_proj", "model.layers.29.mlp.experts.92.down_proj", "model.layers.29.mlp.experts.93.down_proj", "model.layers.29.mlp.experts.94.down_proj", "model.layers.29.mlp.experts.95.down_proj", "model.layers.29.mlp.experts.96.down_proj", "model.layers.29.mlp.experts.97.down_proj", "model.layers.29.mlp.experts.98.down_proj", "model.layers.29.mlp.experts.99.down_proj", "model.layers.29.mlp.experts.100.down_proj", "model.layers.29.mlp.experts.101.down_proj", "model.layers.29.mlp.experts.102.down_proj", "model.layers.29.mlp.experts.103.down_proj", "model.layers.29.mlp.experts.104.down_proj", "model.layers.29.mlp.experts.105.down_proj", "model.layers.29.mlp.experts.106.down_proj", "model.layers.29.mlp.experts.107.down_proj", "model.layers.29.mlp.experts.108.down_proj", "model.layers.29.mlp.experts.109.down_proj", "model.layers.29.mlp.experts.110.down_proj", "model.layers.29.mlp.experts.111.down_proj", "model.layers.29.mlp.experts.112.down_proj", "model.layers.29.mlp.experts.113.down_proj", "model.layers.29.mlp.experts.114.down_proj", "model.layers.29.mlp.experts.115.down_proj", "model.layers.29.mlp.experts.116.down_proj", "model.layers.29.mlp.experts.117.down_proj", "model.layers.29.mlp.experts.118.down_proj", "model.layers.29.mlp.experts.119.down_proj", "model.layers.29.mlp.experts.120.down_proj", "model.layers.29.mlp.experts.121.down_proj", "model.layers.29.mlp.experts.122.down_proj", "model.layers.29.mlp.experts.123.down_proj", "model.layers.29.mlp.experts.124.down_proj", "model.layers.29.mlp.experts.125.down_proj", "model.layers.29.mlp.experts.126.down_proj", "model.layers.29.mlp.experts.127.down_proj", "model.layers.29.mlp.experts.128.down_proj", "model.layers.29.mlp.experts.129.down_proj", "model.layers.29.mlp.experts.130.down_proj", "model.layers.29.mlp.experts.131.down_proj", "model.layers.29.mlp.experts.132.down_proj", "model.layers.29.mlp.experts.133.down_proj", "model.layers.29.mlp.experts.134.down_proj", "model.layers.29.mlp.experts.135.down_proj", "model.layers.29.mlp.experts.136.down_proj", "model.layers.29.mlp.experts.137.down_proj", "model.layers.29.mlp.experts.138.down_proj", "model.layers.29.mlp.experts.139.down_proj", "model.layers.29.mlp.experts.140.down_proj", "model.layers.29.mlp.experts.141.down_proj", "model.layers.29.mlp.experts.142.down_proj", "model.layers.29.mlp.experts.143.down_proj", "model.layers.29.mlp.experts.144.down_proj", "model.layers.29.mlp.experts.145.down_proj", "model.layers.29.mlp.experts.146.down_proj", "model.layers.29.mlp.experts.147.down_proj", "model.layers.29.mlp.experts.148.down_proj", "model.layers.29.mlp.experts.149.down_proj", "model.layers.29.mlp.experts.150.down_proj", "model.layers.29.mlp.experts.151.down_proj", "model.layers.29.mlp.experts.152.down_proj", "model.layers.29.mlp.experts.153.down_proj", "model.layers.29.mlp.experts.154.down_proj", "model.layers.29.mlp.experts.155.down_proj", "model.layers.29.mlp.experts.156.down_proj", "model.layers.29.mlp.experts.157.down_proj", "model.layers.29.mlp.experts.158.down_proj", "model.layers.29.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.9141781851642345e-06, "dbits": 1258291200 }, { "dkld": -4.371278919279575e-06, "dbits": 2516582400 } ] }, { "idx": 177, "layers": [ "model.layers.30.self_attn.q_proj" ], "candidates": [ { "dkld": -2.4990178644646727e-06, "dbits": 62914560 }, { "dkld": -1.6651116311536263e-06, "dbits": 125829120 } ] }, { "idx": 178, "layers": [ "model.layers.30.self_attn.k_proj", "model.layers.30.self_attn.v_proj" ], "candidates": [ { "dkld": -2.8825132176273083e-06, "dbits": 10485760 }, { "dkld": -5.181771703064407e-05, "dbits": 20971520 } ] }, { "idx": 179, "layers": [ "model.layers.30.self_attn.o_proj" ], "candidates": [ { "dkld": -4.720778670161928e-05, "dbits": 62914560 }, { "dkld": -0.00011212106328457525, "dbits": 125829120 } ] }, { "idx": 180, "layers": [ "model.layers.30.mlp.shared_experts.gate_proj", "model.layers.30.mlp.shared_experts.up_proj", "model.layers.30.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00011625331826507941, "dbits": 23592960 }, { "dkld": -6.669294089078903e-05, "dbits": 47185920 } ] }, { "idx": 181, "layers": [ "model.layers.30.mlp.experts.0.gate_proj", "model.layers.30.mlp.experts.1.gate_proj", "model.layers.30.mlp.experts.2.gate_proj", "model.layers.30.mlp.experts.3.gate_proj", "model.layers.30.mlp.experts.4.gate_proj", "model.layers.30.mlp.experts.5.gate_proj", "model.layers.30.mlp.experts.6.gate_proj", "model.layers.30.mlp.experts.7.gate_proj", "model.layers.30.mlp.experts.8.gate_proj", "model.layers.30.mlp.experts.9.gate_proj", "model.layers.30.mlp.experts.10.gate_proj", "model.layers.30.mlp.experts.11.gate_proj", "model.layers.30.mlp.experts.12.gate_proj", "model.layers.30.mlp.experts.13.gate_proj", "model.layers.30.mlp.experts.14.gate_proj", "model.layers.30.mlp.experts.15.gate_proj", "model.layers.30.mlp.experts.16.gate_proj", "model.layers.30.mlp.experts.17.gate_proj", "model.layers.30.mlp.experts.18.gate_proj", "model.layers.30.mlp.experts.19.gate_proj", "model.layers.30.mlp.experts.20.gate_proj", "model.layers.30.mlp.experts.21.gate_proj", "model.layers.30.mlp.experts.22.gate_proj", "model.layers.30.mlp.experts.23.gate_proj", "model.layers.30.mlp.experts.24.gate_proj", "model.layers.30.mlp.experts.25.gate_proj", "model.layers.30.mlp.experts.26.gate_proj", "model.layers.30.mlp.experts.27.gate_proj", "model.layers.30.mlp.experts.28.gate_proj", "model.layers.30.mlp.experts.29.gate_proj", "model.layers.30.mlp.experts.30.gate_proj", "model.layers.30.mlp.experts.31.gate_proj", "model.layers.30.mlp.experts.32.gate_proj", "model.layers.30.mlp.experts.33.gate_proj", "model.layers.30.mlp.experts.34.gate_proj", "model.layers.30.mlp.experts.35.gate_proj", "model.layers.30.mlp.experts.36.gate_proj", "model.layers.30.mlp.experts.37.gate_proj", "model.layers.30.mlp.experts.38.gate_proj", "model.layers.30.mlp.experts.39.gate_proj", "model.layers.30.mlp.experts.40.gate_proj", "model.layers.30.mlp.experts.41.gate_proj", "model.layers.30.mlp.experts.42.gate_proj", "model.layers.30.mlp.experts.43.gate_proj", "model.layers.30.mlp.experts.44.gate_proj", "model.layers.30.mlp.experts.45.gate_proj", "model.layers.30.mlp.experts.46.gate_proj", "model.layers.30.mlp.experts.47.gate_proj", "model.layers.30.mlp.experts.48.gate_proj", "model.layers.30.mlp.experts.49.gate_proj", "model.layers.30.mlp.experts.50.gate_proj", "model.layers.30.mlp.experts.51.gate_proj", "model.layers.30.mlp.experts.52.gate_proj", "model.layers.30.mlp.experts.53.gate_proj", "model.layers.30.mlp.experts.54.gate_proj", "model.layers.30.mlp.experts.55.gate_proj", "model.layers.30.mlp.experts.56.gate_proj", "model.layers.30.mlp.experts.57.gate_proj", "model.layers.30.mlp.experts.58.gate_proj", "model.layers.30.mlp.experts.59.gate_proj", "model.layers.30.mlp.experts.60.gate_proj", "model.layers.30.mlp.experts.61.gate_proj", "model.layers.30.mlp.experts.62.gate_proj", "model.layers.30.mlp.experts.63.gate_proj", "model.layers.30.mlp.experts.64.gate_proj", "model.layers.30.mlp.experts.65.gate_proj", "model.layers.30.mlp.experts.66.gate_proj", "model.layers.30.mlp.experts.67.gate_proj", "model.layers.30.mlp.experts.68.gate_proj", "model.layers.30.mlp.experts.69.gate_proj", "model.layers.30.mlp.experts.70.gate_proj", "model.layers.30.mlp.experts.71.gate_proj", "model.layers.30.mlp.experts.72.gate_proj", "model.layers.30.mlp.experts.73.gate_proj", "model.layers.30.mlp.experts.74.gate_proj", "model.layers.30.mlp.experts.75.gate_proj", "model.layers.30.mlp.experts.76.gate_proj", "model.layers.30.mlp.experts.77.gate_proj", "model.layers.30.mlp.experts.78.gate_proj", "model.layers.30.mlp.experts.79.gate_proj", "model.layers.30.mlp.experts.80.gate_proj", "model.layers.30.mlp.experts.81.gate_proj", "model.layers.30.mlp.experts.82.gate_proj", "model.layers.30.mlp.experts.83.gate_proj", "model.layers.30.mlp.experts.84.gate_proj", "model.layers.30.mlp.experts.85.gate_proj", "model.layers.30.mlp.experts.86.gate_proj", "model.layers.30.mlp.experts.87.gate_proj", "model.layers.30.mlp.experts.88.gate_proj", "model.layers.30.mlp.experts.89.gate_proj", "model.layers.30.mlp.experts.90.gate_proj", "model.layers.30.mlp.experts.91.gate_proj", "model.layers.30.mlp.experts.92.gate_proj", "model.layers.30.mlp.experts.93.gate_proj", "model.layers.30.mlp.experts.94.gate_proj", "model.layers.30.mlp.experts.95.gate_proj", "model.layers.30.mlp.experts.96.gate_proj", "model.layers.30.mlp.experts.97.gate_proj", "model.layers.30.mlp.experts.98.gate_proj", "model.layers.30.mlp.experts.99.gate_proj", "model.layers.30.mlp.experts.100.gate_proj", "model.layers.30.mlp.experts.101.gate_proj", "model.layers.30.mlp.experts.102.gate_proj", "model.layers.30.mlp.experts.103.gate_proj", "model.layers.30.mlp.experts.104.gate_proj", "model.layers.30.mlp.experts.105.gate_proj", "model.layers.30.mlp.experts.106.gate_proj", "model.layers.30.mlp.experts.107.gate_proj", "model.layers.30.mlp.experts.108.gate_proj", "model.layers.30.mlp.experts.109.gate_proj", "model.layers.30.mlp.experts.110.gate_proj", "model.layers.30.mlp.experts.111.gate_proj", "model.layers.30.mlp.experts.112.gate_proj", "model.layers.30.mlp.experts.113.gate_proj", "model.layers.30.mlp.experts.114.gate_proj", "model.layers.30.mlp.experts.115.gate_proj", "model.layers.30.mlp.experts.116.gate_proj", "model.layers.30.mlp.experts.117.gate_proj", "model.layers.30.mlp.experts.118.gate_proj", "model.layers.30.mlp.experts.119.gate_proj", "model.layers.30.mlp.experts.120.gate_proj", "model.layers.30.mlp.experts.121.gate_proj", "model.layers.30.mlp.experts.122.gate_proj", "model.layers.30.mlp.experts.123.gate_proj", "model.layers.30.mlp.experts.124.gate_proj", "model.layers.30.mlp.experts.125.gate_proj", "model.layers.30.mlp.experts.126.gate_proj", "model.layers.30.mlp.experts.127.gate_proj", "model.layers.30.mlp.experts.128.gate_proj", "model.layers.30.mlp.experts.129.gate_proj", "model.layers.30.mlp.experts.130.gate_proj", "model.layers.30.mlp.experts.131.gate_proj", "model.layers.30.mlp.experts.132.gate_proj", "model.layers.30.mlp.experts.133.gate_proj", "model.layers.30.mlp.experts.134.gate_proj", "model.layers.30.mlp.experts.135.gate_proj", "model.layers.30.mlp.experts.136.gate_proj", "model.layers.30.mlp.experts.137.gate_proj", "model.layers.30.mlp.experts.138.gate_proj", "model.layers.30.mlp.experts.139.gate_proj", "model.layers.30.mlp.experts.140.gate_proj", "model.layers.30.mlp.experts.141.gate_proj", "model.layers.30.mlp.experts.142.gate_proj", "model.layers.30.mlp.experts.143.gate_proj", "model.layers.30.mlp.experts.144.gate_proj", "model.layers.30.mlp.experts.145.gate_proj", "model.layers.30.mlp.experts.146.gate_proj", "model.layers.30.mlp.experts.147.gate_proj", "model.layers.30.mlp.experts.148.gate_proj", "model.layers.30.mlp.experts.149.gate_proj", "model.layers.30.mlp.experts.150.gate_proj", "model.layers.30.mlp.experts.151.gate_proj", "model.layers.30.mlp.experts.152.gate_proj", "model.layers.30.mlp.experts.153.gate_proj", "model.layers.30.mlp.experts.154.gate_proj", "model.layers.30.mlp.experts.155.gate_proj", "model.layers.30.mlp.experts.156.gate_proj", "model.layers.30.mlp.experts.157.gate_proj", "model.layers.30.mlp.experts.158.gate_proj", "model.layers.30.mlp.experts.159.gate_proj", "model.layers.30.mlp.experts.0.up_proj", "model.layers.30.mlp.experts.1.up_proj", "model.layers.30.mlp.experts.2.up_proj", "model.layers.30.mlp.experts.3.up_proj", "model.layers.30.mlp.experts.4.up_proj", "model.layers.30.mlp.experts.5.up_proj", "model.layers.30.mlp.experts.6.up_proj", "model.layers.30.mlp.experts.7.up_proj", "model.layers.30.mlp.experts.8.up_proj", "model.layers.30.mlp.experts.9.up_proj", "model.layers.30.mlp.experts.10.up_proj", "model.layers.30.mlp.experts.11.up_proj", "model.layers.30.mlp.experts.12.up_proj", "model.layers.30.mlp.experts.13.up_proj", "model.layers.30.mlp.experts.14.up_proj", "model.layers.30.mlp.experts.15.up_proj", "model.layers.30.mlp.experts.16.up_proj", "model.layers.30.mlp.experts.17.up_proj", "model.layers.30.mlp.experts.18.up_proj", "model.layers.30.mlp.experts.19.up_proj", "model.layers.30.mlp.experts.20.up_proj", "model.layers.30.mlp.experts.21.up_proj", "model.layers.30.mlp.experts.22.up_proj", "model.layers.30.mlp.experts.23.up_proj", "model.layers.30.mlp.experts.24.up_proj", "model.layers.30.mlp.experts.25.up_proj", "model.layers.30.mlp.experts.26.up_proj", "model.layers.30.mlp.experts.27.up_proj", "model.layers.30.mlp.experts.28.up_proj", "model.layers.30.mlp.experts.29.up_proj", "model.layers.30.mlp.experts.30.up_proj", "model.layers.30.mlp.experts.31.up_proj", "model.layers.30.mlp.experts.32.up_proj", "model.layers.30.mlp.experts.33.up_proj", "model.layers.30.mlp.experts.34.up_proj", "model.layers.30.mlp.experts.35.up_proj", "model.layers.30.mlp.experts.36.up_proj", "model.layers.30.mlp.experts.37.up_proj", "model.layers.30.mlp.experts.38.up_proj", "model.layers.30.mlp.experts.39.up_proj", "model.layers.30.mlp.experts.40.up_proj", "model.layers.30.mlp.experts.41.up_proj", "model.layers.30.mlp.experts.42.up_proj", "model.layers.30.mlp.experts.43.up_proj", "model.layers.30.mlp.experts.44.up_proj", "model.layers.30.mlp.experts.45.up_proj", "model.layers.30.mlp.experts.46.up_proj", "model.layers.30.mlp.experts.47.up_proj", "model.layers.30.mlp.experts.48.up_proj", "model.layers.30.mlp.experts.49.up_proj", "model.layers.30.mlp.experts.50.up_proj", "model.layers.30.mlp.experts.51.up_proj", "model.layers.30.mlp.experts.52.up_proj", "model.layers.30.mlp.experts.53.up_proj", "model.layers.30.mlp.experts.54.up_proj", "model.layers.30.mlp.experts.55.up_proj", "model.layers.30.mlp.experts.56.up_proj", "model.layers.30.mlp.experts.57.up_proj", "model.layers.30.mlp.experts.58.up_proj", "model.layers.30.mlp.experts.59.up_proj", "model.layers.30.mlp.experts.60.up_proj", "model.layers.30.mlp.experts.61.up_proj", "model.layers.30.mlp.experts.62.up_proj", "model.layers.30.mlp.experts.63.up_proj", "model.layers.30.mlp.experts.64.up_proj", "model.layers.30.mlp.experts.65.up_proj", "model.layers.30.mlp.experts.66.up_proj", "model.layers.30.mlp.experts.67.up_proj", "model.layers.30.mlp.experts.68.up_proj", "model.layers.30.mlp.experts.69.up_proj", "model.layers.30.mlp.experts.70.up_proj", "model.layers.30.mlp.experts.71.up_proj", "model.layers.30.mlp.experts.72.up_proj", "model.layers.30.mlp.experts.73.up_proj", "model.layers.30.mlp.experts.74.up_proj", "model.layers.30.mlp.experts.75.up_proj", "model.layers.30.mlp.experts.76.up_proj", "model.layers.30.mlp.experts.77.up_proj", "model.layers.30.mlp.experts.78.up_proj", "model.layers.30.mlp.experts.79.up_proj", "model.layers.30.mlp.experts.80.up_proj", "model.layers.30.mlp.experts.81.up_proj", "model.layers.30.mlp.experts.82.up_proj", "model.layers.30.mlp.experts.83.up_proj", "model.layers.30.mlp.experts.84.up_proj", "model.layers.30.mlp.experts.85.up_proj", "model.layers.30.mlp.experts.86.up_proj", "model.layers.30.mlp.experts.87.up_proj", "model.layers.30.mlp.experts.88.up_proj", "model.layers.30.mlp.experts.89.up_proj", "model.layers.30.mlp.experts.90.up_proj", "model.layers.30.mlp.experts.91.up_proj", "model.layers.30.mlp.experts.92.up_proj", "model.layers.30.mlp.experts.93.up_proj", "model.layers.30.mlp.experts.94.up_proj", "model.layers.30.mlp.experts.95.up_proj", "model.layers.30.mlp.experts.96.up_proj", "model.layers.30.mlp.experts.97.up_proj", "model.layers.30.mlp.experts.98.up_proj", "model.layers.30.mlp.experts.99.up_proj", "model.layers.30.mlp.experts.100.up_proj", "model.layers.30.mlp.experts.101.up_proj", "model.layers.30.mlp.experts.102.up_proj", "model.layers.30.mlp.experts.103.up_proj", "model.layers.30.mlp.experts.104.up_proj", "model.layers.30.mlp.experts.105.up_proj", "model.layers.30.mlp.experts.106.up_proj", "model.layers.30.mlp.experts.107.up_proj", "model.layers.30.mlp.experts.108.up_proj", "model.layers.30.mlp.experts.109.up_proj", "model.layers.30.mlp.experts.110.up_proj", "model.layers.30.mlp.experts.111.up_proj", "model.layers.30.mlp.experts.112.up_proj", "model.layers.30.mlp.experts.113.up_proj", "model.layers.30.mlp.experts.114.up_proj", "model.layers.30.mlp.experts.115.up_proj", "model.layers.30.mlp.experts.116.up_proj", "model.layers.30.mlp.experts.117.up_proj", "model.layers.30.mlp.experts.118.up_proj", "model.layers.30.mlp.experts.119.up_proj", "model.layers.30.mlp.experts.120.up_proj", "model.layers.30.mlp.experts.121.up_proj", "model.layers.30.mlp.experts.122.up_proj", "model.layers.30.mlp.experts.123.up_proj", "model.layers.30.mlp.experts.124.up_proj", "model.layers.30.mlp.experts.125.up_proj", "model.layers.30.mlp.experts.126.up_proj", "model.layers.30.mlp.experts.127.up_proj", "model.layers.30.mlp.experts.128.up_proj", "model.layers.30.mlp.experts.129.up_proj", "model.layers.30.mlp.experts.130.up_proj", "model.layers.30.mlp.experts.131.up_proj", "model.layers.30.mlp.experts.132.up_proj", "model.layers.30.mlp.experts.133.up_proj", "model.layers.30.mlp.experts.134.up_proj", "model.layers.30.mlp.experts.135.up_proj", "model.layers.30.mlp.experts.136.up_proj", "model.layers.30.mlp.experts.137.up_proj", "model.layers.30.mlp.experts.138.up_proj", "model.layers.30.mlp.experts.139.up_proj", "model.layers.30.mlp.experts.140.up_proj", "model.layers.30.mlp.experts.141.up_proj", "model.layers.30.mlp.experts.142.up_proj", "model.layers.30.mlp.experts.143.up_proj", "model.layers.30.mlp.experts.144.up_proj", "model.layers.30.mlp.experts.145.up_proj", "model.layers.30.mlp.experts.146.up_proj", "model.layers.30.mlp.experts.147.up_proj", "model.layers.30.mlp.experts.148.up_proj", "model.layers.30.mlp.experts.149.up_proj", "model.layers.30.mlp.experts.150.up_proj", "model.layers.30.mlp.experts.151.up_proj", "model.layers.30.mlp.experts.152.up_proj", "model.layers.30.mlp.experts.153.up_proj", "model.layers.30.mlp.experts.154.up_proj", "model.layers.30.mlp.experts.155.up_proj", "model.layers.30.mlp.experts.156.up_proj", "model.layers.30.mlp.experts.157.up_proj", "model.layers.30.mlp.experts.158.up_proj", "model.layers.30.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -6.682053208351135e-05, "dbits": 2516582400 }, { "dkld": -6.944695487618412e-05, "dbits": 5033164800 } ] }, { "idx": 182, "layers": [ "model.layers.30.mlp.experts.0.down_proj", "model.layers.30.mlp.experts.1.down_proj", "model.layers.30.mlp.experts.2.down_proj", "model.layers.30.mlp.experts.3.down_proj", "model.layers.30.mlp.experts.4.down_proj", "model.layers.30.mlp.experts.5.down_proj", "model.layers.30.mlp.experts.6.down_proj", "model.layers.30.mlp.experts.7.down_proj", "model.layers.30.mlp.experts.8.down_proj", "model.layers.30.mlp.experts.9.down_proj", "model.layers.30.mlp.experts.10.down_proj", "model.layers.30.mlp.experts.11.down_proj", "model.layers.30.mlp.experts.12.down_proj", "model.layers.30.mlp.experts.13.down_proj", "model.layers.30.mlp.experts.14.down_proj", "model.layers.30.mlp.experts.15.down_proj", "model.layers.30.mlp.experts.16.down_proj", "model.layers.30.mlp.experts.17.down_proj", "model.layers.30.mlp.experts.18.down_proj", "model.layers.30.mlp.experts.19.down_proj", "model.layers.30.mlp.experts.20.down_proj", "model.layers.30.mlp.experts.21.down_proj", "model.layers.30.mlp.experts.22.down_proj", "model.layers.30.mlp.experts.23.down_proj", "model.layers.30.mlp.experts.24.down_proj", "model.layers.30.mlp.experts.25.down_proj", "model.layers.30.mlp.experts.26.down_proj", "model.layers.30.mlp.experts.27.down_proj", "model.layers.30.mlp.experts.28.down_proj", "model.layers.30.mlp.experts.29.down_proj", "model.layers.30.mlp.experts.30.down_proj", "model.layers.30.mlp.experts.31.down_proj", "model.layers.30.mlp.experts.32.down_proj", "model.layers.30.mlp.experts.33.down_proj", "model.layers.30.mlp.experts.34.down_proj", "model.layers.30.mlp.experts.35.down_proj", "model.layers.30.mlp.experts.36.down_proj", "model.layers.30.mlp.experts.37.down_proj", "model.layers.30.mlp.experts.38.down_proj", "model.layers.30.mlp.experts.39.down_proj", "model.layers.30.mlp.experts.40.down_proj", "model.layers.30.mlp.experts.41.down_proj", "model.layers.30.mlp.experts.42.down_proj", "model.layers.30.mlp.experts.43.down_proj", "model.layers.30.mlp.experts.44.down_proj", "model.layers.30.mlp.experts.45.down_proj", "model.layers.30.mlp.experts.46.down_proj", "model.layers.30.mlp.experts.47.down_proj", "model.layers.30.mlp.experts.48.down_proj", "model.layers.30.mlp.experts.49.down_proj", "model.layers.30.mlp.experts.50.down_proj", "model.layers.30.mlp.experts.51.down_proj", "model.layers.30.mlp.experts.52.down_proj", "model.layers.30.mlp.experts.53.down_proj", "model.layers.30.mlp.experts.54.down_proj", "model.layers.30.mlp.experts.55.down_proj", "model.layers.30.mlp.experts.56.down_proj", "model.layers.30.mlp.experts.57.down_proj", "model.layers.30.mlp.experts.58.down_proj", "model.layers.30.mlp.experts.59.down_proj", "model.layers.30.mlp.experts.60.down_proj", "model.layers.30.mlp.experts.61.down_proj", "model.layers.30.mlp.experts.62.down_proj", "model.layers.30.mlp.experts.63.down_proj", "model.layers.30.mlp.experts.64.down_proj", "model.layers.30.mlp.experts.65.down_proj", "model.layers.30.mlp.experts.66.down_proj", "model.layers.30.mlp.experts.67.down_proj", "model.layers.30.mlp.experts.68.down_proj", "model.layers.30.mlp.experts.69.down_proj", "model.layers.30.mlp.experts.70.down_proj", "model.layers.30.mlp.experts.71.down_proj", "model.layers.30.mlp.experts.72.down_proj", "model.layers.30.mlp.experts.73.down_proj", "model.layers.30.mlp.experts.74.down_proj", "model.layers.30.mlp.experts.75.down_proj", "model.layers.30.mlp.experts.76.down_proj", "model.layers.30.mlp.experts.77.down_proj", "model.layers.30.mlp.experts.78.down_proj", "model.layers.30.mlp.experts.79.down_proj", "model.layers.30.mlp.experts.80.down_proj", "model.layers.30.mlp.experts.81.down_proj", "model.layers.30.mlp.experts.82.down_proj", "model.layers.30.mlp.experts.83.down_proj", "model.layers.30.mlp.experts.84.down_proj", "model.layers.30.mlp.experts.85.down_proj", "model.layers.30.mlp.experts.86.down_proj", "model.layers.30.mlp.experts.87.down_proj", "model.layers.30.mlp.experts.88.down_proj", "model.layers.30.mlp.experts.89.down_proj", "model.layers.30.mlp.experts.90.down_proj", "model.layers.30.mlp.experts.91.down_proj", "model.layers.30.mlp.experts.92.down_proj", "model.layers.30.mlp.experts.93.down_proj", "model.layers.30.mlp.experts.94.down_proj", "model.layers.30.mlp.experts.95.down_proj", "model.layers.30.mlp.experts.96.down_proj", "model.layers.30.mlp.experts.97.down_proj", "model.layers.30.mlp.experts.98.down_proj", "model.layers.30.mlp.experts.99.down_proj", "model.layers.30.mlp.experts.100.down_proj", "model.layers.30.mlp.experts.101.down_proj", "model.layers.30.mlp.experts.102.down_proj", "model.layers.30.mlp.experts.103.down_proj", "model.layers.30.mlp.experts.104.down_proj", "model.layers.30.mlp.experts.105.down_proj", "model.layers.30.mlp.experts.106.down_proj", "model.layers.30.mlp.experts.107.down_proj", "model.layers.30.mlp.experts.108.down_proj", "model.layers.30.mlp.experts.109.down_proj", "model.layers.30.mlp.experts.110.down_proj", "model.layers.30.mlp.experts.111.down_proj", "model.layers.30.mlp.experts.112.down_proj", "model.layers.30.mlp.experts.113.down_proj", "model.layers.30.mlp.experts.114.down_proj", "model.layers.30.mlp.experts.115.down_proj", "model.layers.30.mlp.experts.116.down_proj", "model.layers.30.mlp.experts.117.down_proj", "model.layers.30.mlp.experts.118.down_proj", "model.layers.30.mlp.experts.119.down_proj", "model.layers.30.mlp.experts.120.down_proj", "model.layers.30.mlp.experts.121.down_proj", "model.layers.30.mlp.experts.122.down_proj", "model.layers.30.mlp.experts.123.down_proj", "model.layers.30.mlp.experts.124.down_proj", "model.layers.30.mlp.experts.125.down_proj", "model.layers.30.mlp.experts.126.down_proj", "model.layers.30.mlp.experts.127.down_proj", "model.layers.30.mlp.experts.128.down_proj", "model.layers.30.mlp.experts.129.down_proj", "model.layers.30.mlp.experts.130.down_proj", "model.layers.30.mlp.experts.131.down_proj", "model.layers.30.mlp.experts.132.down_proj", "model.layers.30.mlp.experts.133.down_proj", "model.layers.30.mlp.experts.134.down_proj", "model.layers.30.mlp.experts.135.down_proj", "model.layers.30.mlp.experts.136.down_proj", "model.layers.30.mlp.experts.137.down_proj", "model.layers.30.mlp.experts.138.down_proj", "model.layers.30.mlp.experts.139.down_proj", "model.layers.30.mlp.experts.140.down_proj", "model.layers.30.mlp.experts.141.down_proj", "model.layers.30.mlp.experts.142.down_proj", "model.layers.30.mlp.experts.143.down_proj", "model.layers.30.mlp.experts.144.down_proj", "model.layers.30.mlp.experts.145.down_proj", "model.layers.30.mlp.experts.146.down_proj", "model.layers.30.mlp.experts.147.down_proj", "model.layers.30.mlp.experts.148.down_proj", "model.layers.30.mlp.experts.149.down_proj", "model.layers.30.mlp.experts.150.down_proj", "model.layers.30.mlp.experts.151.down_proj", "model.layers.30.mlp.experts.152.down_proj", "model.layers.30.mlp.experts.153.down_proj", "model.layers.30.mlp.experts.154.down_proj", "model.layers.30.mlp.experts.155.down_proj", "model.layers.30.mlp.experts.156.down_proj", "model.layers.30.mlp.experts.157.down_proj", "model.layers.30.mlp.experts.158.down_proj", "model.layers.30.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.2533535957335732e-05, "dbits": 1258291200 }, { "dkld": -2.89426650851958e-05, "dbits": 2516582400 } ] }, { "idx": 183, "layers": [ "model.layers.31.self_attn.q_proj" ], "candidates": [ { "dkld": 4.990654997527599e-05, "dbits": 62914560 }, { "dkld": -1.365416683256522e-05, "dbits": 125829120 } ] }, { "idx": 184, "layers": [ "model.layers.31.self_attn.k_proj", "model.layers.31.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00030964212492108276, "dbits": 10485760 }, { "dkld": -0.00015468480996787444, "dbits": 20971520 } ] }, { "idx": 185, "layers": [ "model.layers.31.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00012883159797638655, "dbits": 62914560 }, { "dkld": -4.2350380681455135e-05, "dbits": 125829120 } ] }, { "idx": 186, "layers": [ "model.layers.31.mlp.shared_experts.gate_proj", "model.layers.31.mlp.shared_experts.up_proj", "model.layers.31.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.0002930004615336653, "dbits": 23592960 }, { "dkld": -0.0003754340112209313, "dbits": 47185920 } ] }, { "idx": 187, "layers": [ "model.layers.31.mlp.experts.0.gate_proj", "model.layers.31.mlp.experts.1.gate_proj", "model.layers.31.mlp.experts.2.gate_proj", "model.layers.31.mlp.experts.3.gate_proj", "model.layers.31.mlp.experts.4.gate_proj", "model.layers.31.mlp.experts.5.gate_proj", "model.layers.31.mlp.experts.6.gate_proj", "model.layers.31.mlp.experts.7.gate_proj", "model.layers.31.mlp.experts.8.gate_proj", "model.layers.31.mlp.experts.9.gate_proj", "model.layers.31.mlp.experts.10.gate_proj", "model.layers.31.mlp.experts.11.gate_proj", "model.layers.31.mlp.experts.12.gate_proj", "model.layers.31.mlp.experts.13.gate_proj", "model.layers.31.mlp.experts.14.gate_proj", "model.layers.31.mlp.experts.15.gate_proj", "model.layers.31.mlp.experts.16.gate_proj", "model.layers.31.mlp.experts.17.gate_proj", "model.layers.31.mlp.experts.18.gate_proj", "model.layers.31.mlp.experts.19.gate_proj", "model.layers.31.mlp.experts.20.gate_proj", "model.layers.31.mlp.experts.21.gate_proj", "model.layers.31.mlp.experts.22.gate_proj", "model.layers.31.mlp.experts.23.gate_proj", "model.layers.31.mlp.experts.24.gate_proj", "model.layers.31.mlp.experts.25.gate_proj", "model.layers.31.mlp.experts.26.gate_proj", "model.layers.31.mlp.experts.27.gate_proj", "model.layers.31.mlp.experts.28.gate_proj", "model.layers.31.mlp.experts.29.gate_proj", "model.layers.31.mlp.experts.30.gate_proj", "model.layers.31.mlp.experts.31.gate_proj", "model.layers.31.mlp.experts.32.gate_proj", "model.layers.31.mlp.experts.33.gate_proj", "model.layers.31.mlp.experts.34.gate_proj", "model.layers.31.mlp.experts.35.gate_proj", "model.layers.31.mlp.experts.36.gate_proj", "model.layers.31.mlp.experts.37.gate_proj", "model.layers.31.mlp.experts.38.gate_proj", "model.layers.31.mlp.experts.39.gate_proj", "model.layers.31.mlp.experts.40.gate_proj", "model.layers.31.mlp.experts.41.gate_proj", "model.layers.31.mlp.experts.42.gate_proj", "model.layers.31.mlp.experts.43.gate_proj", "model.layers.31.mlp.experts.44.gate_proj", "model.layers.31.mlp.experts.45.gate_proj", "model.layers.31.mlp.experts.46.gate_proj", "model.layers.31.mlp.experts.47.gate_proj", "model.layers.31.mlp.experts.48.gate_proj", "model.layers.31.mlp.experts.49.gate_proj", "model.layers.31.mlp.experts.50.gate_proj", "model.layers.31.mlp.experts.51.gate_proj", "model.layers.31.mlp.experts.52.gate_proj", "model.layers.31.mlp.experts.53.gate_proj", "model.layers.31.mlp.experts.54.gate_proj", "model.layers.31.mlp.experts.55.gate_proj", "model.layers.31.mlp.experts.56.gate_proj", "model.layers.31.mlp.experts.57.gate_proj", "model.layers.31.mlp.experts.58.gate_proj", "model.layers.31.mlp.experts.59.gate_proj", "model.layers.31.mlp.experts.60.gate_proj", "model.layers.31.mlp.experts.61.gate_proj", "model.layers.31.mlp.experts.62.gate_proj", "model.layers.31.mlp.experts.63.gate_proj", "model.layers.31.mlp.experts.64.gate_proj", "model.layers.31.mlp.experts.65.gate_proj", "model.layers.31.mlp.experts.66.gate_proj", "model.layers.31.mlp.experts.67.gate_proj", "model.layers.31.mlp.experts.68.gate_proj", "model.layers.31.mlp.experts.69.gate_proj", "model.layers.31.mlp.experts.70.gate_proj", "model.layers.31.mlp.experts.71.gate_proj", "model.layers.31.mlp.experts.72.gate_proj", "model.layers.31.mlp.experts.73.gate_proj", "model.layers.31.mlp.experts.74.gate_proj", "model.layers.31.mlp.experts.75.gate_proj", "model.layers.31.mlp.experts.76.gate_proj", "model.layers.31.mlp.experts.77.gate_proj", "model.layers.31.mlp.experts.78.gate_proj", "model.layers.31.mlp.experts.79.gate_proj", "model.layers.31.mlp.experts.80.gate_proj", "model.layers.31.mlp.experts.81.gate_proj", "model.layers.31.mlp.experts.82.gate_proj", "model.layers.31.mlp.experts.83.gate_proj", "model.layers.31.mlp.experts.84.gate_proj", "model.layers.31.mlp.experts.85.gate_proj", "model.layers.31.mlp.experts.86.gate_proj", "model.layers.31.mlp.experts.87.gate_proj", "model.layers.31.mlp.experts.88.gate_proj", "model.layers.31.mlp.experts.89.gate_proj", "model.layers.31.mlp.experts.90.gate_proj", "model.layers.31.mlp.experts.91.gate_proj", "model.layers.31.mlp.experts.92.gate_proj", "model.layers.31.mlp.experts.93.gate_proj", "model.layers.31.mlp.experts.94.gate_proj", "model.layers.31.mlp.experts.95.gate_proj", "model.layers.31.mlp.experts.96.gate_proj", "model.layers.31.mlp.experts.97.gate_proj", "model.layers.31.mlp.experts.98.gate_proj", "model.layers.31.mlp.experts.99.gate_proj", "model.layers.31.mlp.experts.100.gate_proj", "model.layers.31.mlp.experts.101.gate_proj", "model.layers.31.mlp.experts.102.gate_proj", "model.layers.31.mlp.experts.103.gate_proj", "model.layers.31.mlp.experts.104.gate_proj", "model.layers.31.mlp.experts.105.gate_proj", "model.layers.31.mlp.experts.106.gate_proj", "model.layers.31.mlp.experts.107.gate_proj", "model.layers.31.mlp.experts.108.gate_proj", "model.layers.31.mlp.experts.109.gate_proj", "model.layers.31.mlp.experts.110.gate_proj", "model.layers.31.mlp.experts.111.gate_proj", "model.layers.31.mlp.experts.112.gate_proj", "model.layers.31.mlp.experts.113.gate_proj", "model.layers.31.mlp.experts.114.gate_proj", "model.layers.31.mlp.experts.115.gate_proj", "model.layers.31.mlp.experts.116.gate_proj", "model.layers.31.mlp.experts.117.gate_proj", "model.layers.31.mlp.experts.118.gate_proj", "model.layers.31.mlp.experts.119.gate_proj", "model.layers.31.mlp.experts.120.gate_proj", "model.layers.31.mlp.experts.121.gate_proj", "model.layers.31.mlp.experts.122.gate_proj", "model.layers.31.mlp.experts.123.gate_proj", "model.layers.31.mlp.experts.124.gate_proj", "model.layers.31.mlp.experts.125.gate_proj", "model.layers.31.mlp.experts.126.gate_proj", "model.layers.31.mlp.experts.127.gate_proj", "model.layers.31.mlp.experts.128.gate_proj", "model.layers.31.mlp.experts.129.gate_proj", "model.layers.31.mlp.experts.130.gate_proj", "model.layers.31.mlp.experts.131.gate_proj", "model.layers.31.mlp.experts.132.gate_proj", "model.layers.31.mlp.experts.133.gate_proj", "model.layers.31.mlp.experts.134.gate_proj", "model.layers.31.mlp.experts.135.gate_proj", "model.layers.31.mlp.experts.136.gate_proj", "model.layers.31.mlp.experts.137.gate_proj", "model.layers.31.mlp.experts.138.gate_proj", "model.layers.31.mlp.experts.139.gate_proj", "model.layers.31.mlp.experts.140.gate_proj", "model.layers.31.mlp.experts.141.gate_proj", "model.layers.31.mlp.experts.142.gate_proj", "model.layers.31.mlp.experts.143.gate_proj", "model.layers.31.mlp.experts.144.gate_proj", "model.layers.31.mlp.experts.145.gate_proj", "model.layers.31.mlp.experts.146.gate_proj", "model.layers.31.mlp.experts.147.gate_proj", "model.layers.31.mlp.experts.148.gate_proj", "model.layers.31.mlp.experts.149.gate_proj", "model.layers.31.mlp.experts.150.gate_proj", "model.layers.31.mlp.experts.151.gate_proj", "model.layers.31.mlp.experts.152.gate_proj", "model.layers.31.mlp.experts.153.gate_proj", "model.layers.31.mlp.experts.154.gate_proj", "model.layers.31.mlp.experts.155.gate_proj", "model.layers.31.mlp.experts.156.gate_proj", "model.layers.31.mlp.experts.157.gate_proj", "model.layers.31.mlp.experts.158.gate_proj", "model.layers.31.mlp.experts.159.gate_proj", "model.layers.31.mlp.experts.0.up_proj", "model.layers.31.mlp.experts.1.up_proj", "model.layers.31.mlp.experts.2.up_proj", "model.layers.31.mlp.experts.3.up_proj", "model.layers.31.mlp.experts.4.up_proj", "model.layers.31.mlp.experts.5.up_proj", "model.layers.31.mlp.experts.6.up_proj", "model.layers.31.mlp.experts.7.up_proj", "model.layers.31.mlp.experts.8.up_proj", "model.layers.31.mlp.experts.9.up_proj", "model.layers.31.mlp.experts.10.up_proj", "model.layers.31.mlp.experts.11.up_proj", "model.layers.31.mlp.experts.12.up_proj", "model.layers.31.mlp.experts.13.up_proj", "model.layers.31.mlp.experts.14.up_proj", "model.layers.31.mlp.experts.15.up_proj", "model.layers.31.mlp.experts.16.up_proj", "model.layers.31.mlp.experts.17.up_proj", "model.layers.31.mlp.experts.18.up_proj", "model.layers.31.mlp.experts.19.up_proj", "model.layers.31.mlp.experts.20.up_proj", "model.layers.31.mlp.experts.21.up_proj", "model.layers.31.mlp.experts.22.up_proj", "model.layers.31.mlp.experts.23.up_proj", "model.layers.31.mlp.experts.24.up_proj", "model.layers.31.mlp.experts.25.up_proj", "model.layers.31.mlp.experts.26.up_proj", "model.layers.31.mlp.experts.27.up_proj", "model.layers.31.mlp.experts.28.up_proj", "model.layers.31.mlp.experts.29.up_proj", "model.layers.31.mlp.experts.30.up_proj", "model.layers.31.mlp.experts.31.up_proj", "model.layers.31.mlp.experts.32.up_proj", "model.layers.31.mlp.experts.33.up_proj", "model.layers.31.mlp.experts.34.up_proj", "model.layers.31.mlp.experts.35.up_proj", "model.layers.31.mlp.experts.36.up_proj", "model.layers.31.mlp.experts.37.up_proj", "model.layers.31.mlp.experts.38.up_proj", "model.layers.31.mlp.experts.39.up_proj", "model.layers.31.mlp.experts.40.up_proj", "model.layers.31.mlp.experts.41.up_proj", "model.layers.31.mlp.experts.42.up_proj", "model.layers.31.mlp.experts.43.up_proj", "model.layers.31.mlp.experts.44.up_proj", "model.layers.31.mlp.experts.45.up_proj", "model.layers.31.mlp.experts.46.up_proj", "model.layers.31.mlp.experts.47.up_proj", "model.layers.31.mlp.experts.48.up_proj", "model.layers.31.mlp.experts.49.up_proj", "model.layers.31.mlp.experts.50.up_proj", "model.layers.31.mlp.experts.51.up_proj", "model.layers.31.mlp.experts.52.up_proj", "model.layers.31.mlp.experts.53.up_proj", "model.layers.31.mlp.experts.54.up_proj", "model.layers.31.mlp.experts.55.up_proj", "model.layers.31.mlp.experts.56.up_proj", "model.layers.31.mlp.experts.57.up_proj", "model.layers.31.mlp.experts.58.up_proj", "model.layers.31.mlp.experts.59.up_proj", "model.layers.31.mlp.experts.60.up_proj", "model.layers.31.mlp.experts.61.up_proj", "model.layers.31.mlp.experts.62.up_proj", "model.layers.31.mlp.experts.63.up_proj", "model.layers.31.mlp.experts.64.up_proj", "model.layers.31.mlp.experts.65.up_proj", "model.layers.31.mlp.experts.66.up_proj", "model.layers.31.mlp.experts.67.up_proj", "model.layers.31.mlp.experts.68.up_proj", "model.layers.31.mlp.experts.69.up_proj", "model.layers.31.mlp.experts.70.up_proj", "model.layers.31.mlp.experts.71.up_proj", "model.layers.31.mlp.experts.72.up_proj", "model.layers.31.mlp.experts.73.up_proj", "model.layers.31.mlp.experts.74.up_proj", "model.layers.31.mlp.experts.75.up_proj", "model.layers.31.mlp.experts.76.up_proj", "model.layers.31.mlp.experts.77.up_proj", "model.layers.31.mlp.experts.78.up_proj", "model.layers.31.mlp.experts.79.up_proj", "model.layers.31.mlp.experts.80.up_proj", "model.layers.31.mlp.experts.81.up_proj", "model.layers.31.mlp.experts.82.up_proj", "model.layers.31.mlp.experts.83.up_proj", "model.layers.31.mlp.experts.84.up_proj", "model.layers.31.mlp.experts.85.up_proj", "model.layers.31.mlp.experts.86.up_proj", "model.layers.31.mlp.experts.87.up_proj", "model.layers.31.mlp.experts.88.up_proj", "model.layers.31.mlp.experts.89.up_proj", "model.layers.31.mlp.experts.90.up_proj", "model.layers.31.mlp.experts.91.up_proj", "model.layers.31.mlp.experts.92.up_proj", "model.layers.31.mlp.experts.93.up_proj", "model.layers.31.mlp.experts.94.up_proj", "model.layers.31.mlp.experts.95.up_proj", "model.layers.31.mlp.experts.96.up_proj", "model.layers.31.mlp.experts.97.up_proj", "model.layers.31.mlp.experts.98.up_proj", "model.layers.31.mlp.experts.99.up_proj", "model.layers.31.mlp.experts.100.up_proj", "model.layers.31.mlp.experts.101.up_proj", "model.layers.31.mlp.experts.102.up_proj", "model.layers.31.mlp.experts.103.up_proj", "model.layers.31.mlp.experts.104.up_proj", "model.layers.31.mlp.experts.105.up_proj", "model.layers.31.mlp.experts.106.up_proj", "model.layers.31.mlp.experts.107.up_proj", "model.layers.31.mlp.experts.108.up_proj", "model.layers.31.mlp.experts.109.up_proj", "model.layers.31.mlp.experts.110.up_proj", "model.layers.31.mlp.experts.111.up_proj", "model.layers.31.mlp.experts.112.up_proj", "model.layers.31.mlp.experts.113.up_proj", "model.layers.31.mlp.experts.114.up_proj", "model.layers.31.mlp.experts.115.up_proj", "model.layers.31.mlp.experts.116.up_proj", "model.layers.31.mlp.experts.117.up_proj", "model.layers.31.mlp.experts.118.up_proj", "model.layers.31.mlp.experts.119.up_proj", "model.layers.31.mlp.experts.120.up_proj", "model.layers.31.mlp.experts.121.up_proj", "model.layers.31.mlp.experts.122.up_proj", "model.layers.31.mlp.experts.123.up_proj", "model.layers.31.mlp.experts.124.up_proj", "model.layers.31.mlp.experts.125.up_proj", "model.layers.31.mlp.experts.126.up_proj", "model.layers.31.mlp.experts.127.up_proj", "model.layers.31.mlp.experts.128.up_proj", "model.layers.31.mlp.experts.129.up_proj", "model.layers.31.mlp.experts.130.up_proj", "model.layers.31.mlp.experts.131.up_proj", "model.layers.31.mlp.experts.132.up_proj", "model.layers.31.mlp.experts.133.up_proj", "model.layers.31.mlp.experts.134.up_proj", "model.layers.31.mlp.experts.135.up_proj", "model.layers.31.mlp.experts.136.up_proj", "model.layers.31.mlp.experts.137.up_proj", "model.layers.31.mlp.experts.138.up_proj", "model.layers.31.mlp.experts.139.up_proj", "model.layers.31.mlp.experts.140.up_proj", "model.layers.31.mlp.experts.141.up_proj", "model.layers.31.mlp.experts.142.up_proj", "model.layers.31.mlp.experts.143.up_proj", "model.layers.31.mlp.experts.144.up_proj", "model.layers.31.mlp.experts.145.up_proj", "model.layers.31.mlp.experts.146.up_proj", "model.layers.31.mlp.experts.147.up_proj", "model.layers.31.mlp.experts.148.up_proj", "model.layers.31.mlp.experts.149.up_proj", "model.layers.31.mlp.experts.150.up_proj", "model.layers.31.mlp.experts.151.up_proj", "model.layers.31.mlp.experts.152.up_proj", "model.layers.31.mlp.experts.153.up_proj", "model.layers.31.mlp.experts.154.up_proj", "model.layers.31.mlp.experts.155.up_proj", "model.layers.31.mlp.experts.156.up_proj", "model.layers.31.mlp.experts.157.up_proj", "model.layers.31.mlp.experts.158.up_proj", "model.layers.31.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -5.1151751540599866e-05, "dbits": 2516582400 }, { "dkld": -6.347668822854688e-05, "dbits": 5033164800 } ] }, { "idx": 188, "layers": [ "model.layers.31.mlp.experts.0.down_proj", "model.layers.31.mlp.experts.1.down_proj", "model.layers.31.mlp.experts.2.down_proj", "model.layers.31.mlp.experts.3.down_proj", "model.layers.31.mlp.experts.4.down_proj", "model.layers.31.mlp.experts.5.down_proj", "model.layers.31.mlp.experts.6.down_proj", "model.layers.31.mlp.experts.7.down_proj", "model.layers.31.mlp.experts.8.down_proj", "model.layers.31.mlp.experts.9.down_proj", "model.layers.31.mlp.experts.10.down_proj", "model.layers.31.mlp.experts.11.down_proj", "model.layers.31.mlp.experts.12.down_proj", "model.layers.31.mlp.experts.13.down_proj", "model.layers.31.mlp.experts.14.down_proj", "model.layers.31.mlp.experts.15.down_proj", "model.layers.31.mlp.experts.16.down_proj", "model.layers.31.mlp.experts.17.down_proj", "model.layers.31.mlp.experts.18.down_proj", "model.layers.31.mlp.experts.19.down_proj", "model.layers.31.mlp.experts.20.down_proj", "model.layers.31.mlp.experts.21.down_proj", "model.layers.31.mlp.experts.22.down_proj", "model.layers.31.mlp.experts.23.down_proj", "model.layers.31.mlp.experts.24.down_proj", "model.layers.31.mlp.experts.25.down_proj", "model.layers.31.mlp.experts.26.down_proj", "model.layers.31.mlp.experts.27.down_proj", "model.layers.31.mlp.experts.28.down_proj", "model.layers.31.mlp.experts.29.down_proj", "model.layers.31.mlp.experts.30.down_proj", "model.layers.31.mlp.experts.31.down_proj", "model.layers.31.mlp.experts.32.down_proj", "model.layers.31.mlp.experts.33.down_proj", "model.layers.31.mlp.experts.34.down_proj", "model.layers.31.mlp.experts.35.down_proj", "model.layers.31.mlp.experts.36.down_proj", "model.layers.31.mlp.experts.37.down_proj", "model.layers.31.mlp.experts.38.down_proj", "model.layers.31.mlp.experts.39.down_proj", "model.layers.31.mlp.experts.40.down_proj", "model.layers.31.mlp.experts.41.down_proj", "model.layers.31.mlp.experts.42.down_proj", "model.layers.31.mlp.experts.43.down_proj", "model.layers.31.mlp.experts.44.down_proj", "model.layers.31.mlp.experts.45.down_proj", "model.layers.31.mlp.experts.46.down_proj", "model.layers.31.mlp.experts.47.down_proj", "model.layers.31.mlp.experts.48.down_proj", "model.layers.31.mlp.experts.49.down_proj", "model.layers.31.mlp.experts.50.down_proj", "model.layers.31.mlp.experts.51.down_proj", "model.layers.31.mlp.experts.52.down_proj", "model.layers.31.mlp.experts.53.down_proj", "model.layers.31.mlp.experts.54.down_proj", "model.layers.31.mlp.experts.55.down_proj", "model.layers.31.mlp.experts.56.down_proj", "model.layers.31.mlp.experts.57.down_proj", "model.layers.31.mlp.experts.58.down_proj", "model.layers.31.mlp.experts.59.down_proj", "model.layers.31.mlp.experts.60.down_proj", "model.layers.31.mlp.experts.61.down_proj", "model.layers.31.mlp.experts.62.down_proj", "model.layers.31.mlp.experts.63.down_proj", "model.layers.31.mlp.experts.64.down_proj", "model.layers.31.mlp.experts.65.down_proj", "model.layers.31.mlp.experts.66.down_proj", "model.layers.31.mlp.experts.67.down_proj", "model.layers.31.mlp.experts.68.down_proj", "model.layers.31.mlp.experts.69.down_proj", "model.layers.31.mlp.experts.70.down_proj", "model.layers.31.mlp.experts.71.down_proj", "model.layers.31.mlp.experts.72.down_proj", "model.layers.31.mlp.experts.73.down_proj", "model.layers.31.mlp.experts.74.down_proj", "model.layers.31.mlp.experts.75.down_proj", "model.layers.31.mlp.experts.76.down_proj", "model.layers.31.mlp.experts.77.down_proj", "model.layers.31.mlp.experts.78.down_proj", "model.layers.31.mlp.experts.79.down_proj", "model.layers.31.mlp.experts.80.down_proj", "model.layers.31.mlp.experts.81.down_proj", "model.layers.31.mlp.experts.82.down_proj", "model.layers.31.mlp.experts.83.down_proj", "model.layers.31.mlp.experts.84.down_proj", "model.layers.31.mlp.experts.85.down_proj", "model.layers.31.mlp.experts.86.down_proj", "model.layers.31.mlp.experts.87.down_proj", "model.layers.31.mlp.experts.88.down_proj", "model.layers.31.mlp.experts.89.down_proj", "model.layers.31.mlp.experts.90.down_proj", "model.layers.31.mlp.experts.91.down_proj", "model.layers.31.mlp.experts.92.down_proj", "model.layers.31.mlp.experts.93.down_proj", "model.layers.31.mlp.experts.94.down_proj", "model.layers.31.mlp.experts.95.down_proj", "model.layers.31.mlp.experts.96.down_proj", "model.layers.31.mlp.experts.97.down_proj", "model.layers.31.mlp.experts.98.down_proj", "model.layers.31.mlp.experts.99.down_proj", "model.layers.31.mlp.experts.100.down_proj", "model.layers.31.mlp.experts.101.down_proj", "model.layers.31.mlp.experts.102.down_proj", "model.layers.31.mlp.experts.103.down_proj", "model.layers.31.mlp.experts.104.down_proj", "model.layers.31.mlp.experts.105.down_proj", "model.layers.31.mlp.experts.106.down_proj", "model.layers.31.mlp.experts.107.down_proj", "model.layers.31.mlp.experts.108.down_proj", "model.layers.31.mlp.experts.109.down_proj", "model.layers.31.mlp.experts.110.down_proj", "model.layers.31.mlp.experts.111.down_proj", "model.layers.31.mlp.experts.112.down_proj", "model.layers.31.mlp.experts.113.down_proj", "model.layers.31.mlp.experts.114.down_proj", "model.layers.31.mlp.experts.115.down_proj", "model.layers.31.mlp.experts.116.down_proj", "model.layers.31.mlp.experts.117.down_proj", "model.layers.31.mlp.experts.118.down_proj", "model.layers.31.mlp.experts.119.down_proj", "model.layers.31.mlp.experts.120.down_proj", "model.layers.31.mlp.experts.121.down_proj", "model.layers.31.mlp.experts.122.down_proj", "model.layers.31.mlp.experts.123.down_proj", "model.layers.31.mlp.experts.124.down_proj", "model.layers.31.mlp.experts.125.down_proj", "model.layers.31.mlp.experts.126.down_proj", "model.layers.31.mlp.experts.127.down_proj", "model.layers.31.mlp.experts.128.down_proj", "model.layers.31.mlp.experts.129.down_proj", "model.layers.31.mlp.experts.130.down_proj", "model.layers.31.mlp.experts.131.down_proj", "model.layers.31.mlp.experts.132.down_proj", "model.layers.31.mlp.experts.133.down_proj", "model.layers.31.mlp.experts.134.down_proj", "model.layers.31.mlp.experts.135.down_proj", "model.layers.31.mlp.experts.136.down_proj", "model.layers.31.mlp.experts.137.down_proj", "model.layers.31.mlp.experts.138.down_proj", "model.layers.31.mlp.experts.139.down_proj", "model.layers.31.mlp.experts.140.down_proj", "model.layers.31.mlp.experts.141.down_proj", "model.layers.31.mlp.experts.142.down_proj", "model.layers.31.mlp.experts.143.down_proj", "model.layers.31.mlp.experts.144.down_proj", "model.layers.31.mlp.experts.145.down_proj", "model.layers.31.mlp.experts.146.down_proj", "model.layers.31.mlp.experts.147.down_proj", "model.layers.31.mlp.experts.148.down_proj", "model.layers.31.mlp.experts.149.down_proj", "model.layers.31.mlp.experts.150.down_proj", "model.layers.31.mlp.experts.151.down_proj", "model.layers.31.mlp.experts.152.down_proj", "model.layers.31.mlp.experts.153.down_proj", "model.layers.31.mlp.experts.154.down_proj", "model.layers.31.mlp.experts.155.down_proj", "model.layers.31.mlp.experts.156.down_proj", "model.layers.31.mlp.experts.157.down_proj", "model.layers.31.mlp.experts.158.down_proj", "model.layers.31.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -8.489980828016962e-05, "dbits": 1258291200 }, { "dkld": -8.60309461131678e-05, "dbits": 2516582400 } ] }, { "idx": 189, "layers": [ "model.layers.32.self_attn.q_proj" ], "candidates": [ { "dkld": 1.864419318735669e-05, "dbits": 62914560 }, { "dkld": -8.284922223538056e-05, "dbits": 125829120 } ] }, { "idx": 190, "layers": [ "model.layers.32.self_attn.k_proj", "model.layers.32.self_attn.v_proj" ], "candidates": [ { "dkld": 6.63525192067041e-05, "dbits": 10485760 }, { "dkld": -5.734153091900562e-07, "dbits": 20971520 } ] }, { "idx": 191, "layers": [ "model.layers.32.self_attn.o_proj" ], "candidates": [ { "dkld": 0.00011502667330205545, "dbits": 62914560 }, { "dkld": 0.00013249837793409894, "dbits": 125829120 } ] }, { "idx": 192, "layers": [ "model.layers.32.mlp.shared_experts.gate_proj", "model.layers.32.mlp.shared_experts.up_proj", "model.layers.32.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.068942412733997e-05, "dbits": 23592960 }, { "dkld": -0.00013404889032244544, "dbits": 47185920 } ] }, { "idx": 193, "layers": [ "model.layers.32.mlp.experts.0.gate_proj", "model.layers.32.mlp.experts.1.gate_proj", "model.layers.32.mlp.experts.2.gate_proj", "model.layers.32.mlp.experts.3.gate_proj", "model.layers.32.mlp.experts.4.gate_proj", "model.layers.32.mlp.experts.5.gate_proj", "model.layers.32.mlp.experts.6.gate_proj", "model.layers.32.mlp.experts.7.gate_proj", "model.layers.32.mlp.experts.8.gate_proj", "model.layers.32.mlp.experts.9.gate_proj", "model.layers.32.mlp.experts.10.gate_proj", "model.layers.32.mlp.experts.11.gate_proj", "model.layers.32.mlp.experts.12.gate_proj", "model.layers.32.mlp.experts.13.gate_proj", "model.layers.32.mlp.experts.14.gate_proj", "model.layers.32.mlp.experts.15.gate_proj", "model.layers.32.mlp.experts.16.gate_proj", "model.layers.32.mlp.experts.17.gate_proj", "model.layers.32.mlp.experts.18.gate_proj", "model.layers.32.mlp.experts.19.gate_proj", "model.layers.32.mlp.experts.20.gate_proj", "model.layers.32.mlp.experts.21.gate_proj", "model.layers.32.mlp.experts.22.gate_proj", "model.layers.32.mlp.experts.23.gate_proj", "model.layers.32.mlp.experts.24.gate_proj", "model.layers.32.mlp.experts.25.gate_proj", "model.layers.32.mlp.experts.26.gate_proj", "model.layers.32.mlp.experts.27.gate_proj", "model.layers.32.mlp.experts.28.gate_proj", "model.layers.32.mlp.experts.29.gate_proj", "model.layers.32.mlp.experts.30.gate_proj", "model.layers.32.mlp.experts.31.gate_proj", "model.layers.32.mlp.experts.32.gate_proj", "model.layers.32.mlp.experts.33.gate_proj", "model.layers.32.mlp.experts.34.gate_proj", "model.layers.32.mlp.experts.35.gate_proj", "model.layers.32.mlp.experts.36.gate_proj", "model.layers.32.mlp.experts.37.gate_proj", "model.layers.32.mlp.experts.38.gate_proj", "model.layers.32.mlp.experts.39.gate_proj", "model.layers.32.mlp.experts.40.gate_proj", "model.layers.32.mlp.experts.41.gate_proj", "model.layers.32.mlp.experts.42.gate_proj", "model.layers.32.mlp.experts.43.gate_proj", "model.layers.32.mlp.experts.44.gate_proj", "model.layers.32.mlp.experts.45.gate_proj", "model.layers.32.mlp.experts.46.gate_proj", "model.layers.32.mlp.experts.47.gate_proj", "model.layers.32.mlp.experts.48.gate_proj", "model.layers.32.mlp.experts.49.gate_proj", "model.layers.32.mlp.experts.50.gate_proj", "model.layers.32.mlp.experts.51.gate_proj", "model.layers.32.mlp.experts.52.gate_proj", "model.layers.32.mlp.experts.53.gate_proj", "model.layers.32.mlp.experts.54.gate_proj", "model.layers.32.mlp.experts.55.gate_proj", "model.layers.32.mlp.experts.56.gate_proj", "model.layers.32.mlp.experts.57.gate_proj", "model.layers.32.mlp.experts.58.gate_proj", "model.layers.32.mlp.experts.59.gate_proj", "model.layers.32.mlp.experts.60.gate_proj", "model.layers.32.mlp.experts.61.gate_proj", "model.layers.32.mlp.experts.62.gate_proj", "model.layers.32.mlp.experts.63.gate_proj", "model.layers.32.mlp.experts.64.gate_proj", "model.layers.32.mlp.experts.65.gate_proj", "model.layers.32.mlp.experts.66.gate_proj", "model.layers.32.mlp.experts.67.gate_proj", "model.layers.32.mlp.experts.68.gate_proj", "model.layers.32.mlp.experts.69.gate_proj", "model.layers.32.mlp.experts.70.gate_proj", "model.layers.32.mlp.experts.71.gate_proj", "model.layers.32.mlp.experts.72.gate_proj", "model.layers.32.mlp.experts.73.gate_proj", "model.layers.32.mlp.experts.74.gate_proj", "model.layers.32.mlp.experts.75.gate_proj", "model.layers.32.mlp.experts.76.gate_proj", "model.layers.32.mlp.experts.77.gate_proj", "model.layers.32.mlp.experts.78.gate_proj", "model.layers.32.mlp.experts.79.gate_proj", "model.layers.32.mlp.experts.80.gate_proj", "model.layers.32.mlp.experts.81.gate_proj", "model.layers.32.mlp.experts.82.gate_proj", "model.layers.32.mlp.experts.83.gate_proj", "model.layers.32.mlp.experts.84.gate_proj", "model.layers.32.mlp.experts.85.gate_proj", "model.layers.32.mlp.experts.86.gate_proj", "model.layers.32.mlp.experts.87.gate_proj", "model.layers.32.mlp.experts.88.gate_proj", "model.layers.32.mlp.experts.89.gate_proj", "model.layers.32.mlp.experts.90.gate_proj", "model.layers.32.mlp.experts.91.gate_proj", "model.layers.32.mlp.experts.92.gate_proj", "model.layers.32.mlp.experts.93.gate_proj", "model.layers.32.mlp.experts.94.gate_proj", "model.layers.32.mlp.experts.95.gate_proj", "model.layers.32.mlp.experts.96.gate_proj", "model.layers.32.mlp.experts.97.gate_proj", "model.layers.32.mlp.experts.98.gate_proj", "model.layers.32.mlp.experts.99.gate_proj", "model.layers.32.mlp.experts.100.gate_proj", "model.layers.32.mlp.experts.101.gate_proj", "model.layers.32.mlp.experts.102.gate_proj", "model.layers.32.mlp.experts.103.gate_proj", "model.layers.32.mlp.experts.104.gate_proj", "model.layers.32.mlp.experts.105.gate_proj", "model.layers.32.mlp.experts.106.gate_proj", "model.layers.32.mlp.experts.107.gate_proj", "model.layers.32.mlp.experts.108.gate_proj", "model.layers.32.mlp.experts.109.gate_proj", "model.layers.32.mlp.experts.110.gate_proj", "model.layers.32.mlp.experts.111.gate_proj", "model.layers.32.mlp.experts.112.gate_proj", "model.layers.32.mlp.experts.113.gate_proj", "model.layers.32.mlp.experts.114.gate_proj", "model.layers.32.mlp.experts.115.gate_proj", "model.layers.32.mlp.experts.116.gate_proj", "model.layers.32.mlp.experts.117.gate_proj", "model.layers.32.mlp.experts.118.gate_proj", "model.layers.32.mlp.experts.119.gate_proj", "model.layers.32.mlp.experts.120.gate_proj", "model.layers.32.mlp.experts.121.gate_proj", "model.layers.32.mlp.experts.122.gate_proj", "model.layers.32.mlp.experts.123.gate_proj", "model.layers.32.mlp.experts.124.gate_proj", "model.layers.32.mlp.experts.125.gate_proj", "model.layers.32.mlp.experts.126.gate_proj", "model.layers.32.mlp.experts.127.gate_proj", "model.layers.32.mlp.experts.128.gate_proj", "model.layers.32.mlp.experts.129.gate_proj", "model.layers.32.mlp.experts.130.gate_proj", "model.layers.32.mlp.experts.131.gate_proj", "model.layers.32.mlp.experts.132.gate_proj", "model.layers.32.mlp.experts.133.gate_proj", "model.layers.32.mlp.experts.134.gate_proj", "model.layers.32.mlp.experts.135.gate_proj", "model.layers.32.mlp.experts.136.gate_proj", "model.layers.32.mlp.experts.137.gate_proj", "model.layers.32.mlp.experts.138.gate_proj", "model.layers.32.mlp.experts.139.gate_proj", "model.layers.32.mlp.experts.140.gate_proj", "model.layers.32.mlp.experts.141.gate_proj", "model.layers.32.mlp.experts.142.gate_proj", "model.layers.32.mlp.experts.143.gate_proj", "model.layers.32.mlp.experts.144.gate_proj", "model.layers.32.mlp.experts.145.gate_proj", "model.layers.32.mlp.experts.146.gate_proj", "model.layers.32.mlp.experts.147.gate_proj", "model.layers.32.mlp.experts.148.gate_proj", "model.layers.32.mlp.experts.149.gate_proj", "model.layers.32.mlp.experts.150.gate_proj", "model.layers.32.mlp.experts.151.gate_proj", "model.layers.32.mlp.experts.152.gate_proj", "model.layers.32.mlp.experts.153.gate_proj", "model.layers.32.mlp.experts.154.gate_proj", "model.layers.32.mlp.experts.155.gate_proj", "model.layers.32.mlp.experts.156.gate_proj", "model.layers.32.mlp.experts.157.gate_proj", "model.layers.32.mlp.experts.158.gate_proj", "model.layers.32.mlp.experts.159.gate_proj", "model.layers.32.mlp.experts.0.up_proj", "model.layers.32.mlp.experts.1.up_proj", "model.layers.32.mlp.experts.2.up_proj", "model.layers.32.mlp.experts.3.up_proj", "model.layers.32.mlp.experts.4.up_proj", "model.layers.32.mlp.experts.5.up_proj", "model.layers.32.mlp.experts.6.up_proj", "model.layers.32.mlp.experts.7.up_proj", "model.layers.32.mlp.experts.8.up_proj", "model.layers.32.mlp.experts.9.up_proj", "model.layers.32.mlp.experts.10.up_proj", "model.layers.32.mlp.experts.11.up_proj", "model.layers.32.mlp.experts.12.up_proj", "model.layers.32.mlp.experts.13.up_proj", "model.layers.32.mlp.experts.14.up_proj", "model.layers.32.mlp.experts.15.up_proj", "model.layers.32.mlp.experts.16.up_proj", "model.layers.32.mlp.experts.17.up_proj", "model.layers.32.mlp.experts.18.up_proj", "model.layers.32.mlp.experts.19.up_proj", "model.layers.32.mlp.experts.20.up_proj", "model.layers.32.mlp.experts.21.up_proj", "model.layers.32.mlp.experts.22.up_proj", "model.layers.32.mlp.experts.23.up_proj", "model.layers.32.mlp.experts.24.up_proj", "model.layers.32.mlp.experts.25.up_proj", "model.layers.32.mlp.experts.26.up_proj", "model.layers.32.mlp.experts.27.up_proj", "model.layers.32.mlp.experts.28.up_proj", "model.layers.32.mlp.experts.29.up_proj", "model.layers.32.mlp.experts.30.up_proj", "model.layers.32.mlp.experts.31.up_proj", "model.layers.32.mlp.experts.32.up_proj", "model.layers.32.mlp.experts.33.up_proj", "model.layers.32.mlp.experts.34.up_proj", "model.layers.32.mlp.experts.35.up_proj", "model.layers.32.mlp.experts.36.up_proj", "model.layers.32.mlp.experts.37.up_proj", "model.layers.32.mlp.experts.38.up_proj", "model.layers.32.mlp.experts.39.up_proj", "model.layers.32.mlp.experts.40.up_proj", "model.layers.32.mlp.experts.41.up_proj", "model.layers.32.mlp.experts.42.up_proj", "model.layers.32.mlp.experts.43.up_proj", "model.layers.32.mlp.experts.44.up_proj", "model.layers.32.mlp.experts.45.up_proj", "model.layers.32.mlp.experts.46.up_proj", "model.layers.32.mlp.experts.47.up_proj", "model.layers.32.mlp.experts.48.up_proj", "model.layers.32.mlp.experts.49.up_proj", "model.layers.32.mlp.experts.50.up_proj", "model.layers.32.mlp.experts.51.up_proj", "model.layers.32.mlp.experts.52.up_proj", "model.layers.32.mlp.experts.53.up_proj", "model.layers.32.mlp.experts.54.up_proj", "model.layers.32.mlp.experts.55.up_proj", "model.layers.32.mlp.experts.56.up_proj", "model.layers.32.mlp.experts.57.up_proj", "model.layers.32.mlp.experts.58.up_proj", "model.layers.32.mlp.experts.59.up_proj", "model.layers.32.mlp.experts.60.up_proj", "model.layers.32.mlp.experts.61.up_proj", "model.layers.32.mlp.experts.62.up_proj", "model.layers.32.mlp.experts.63.up_proj", "model.layers.32.mlp.experts.64.up_proj", "model.layers.32.mlp.experts.65.up_proj", "model.layers.32.mlp.experts.66.up_proj", "model.layers.32.mlp.experts.67.up_proj", "model.layers.32.mlp.experts.68.up_proj", "model.layers.32.mlp.experts.69.up_proj", "model.layers.32.mlp.experts.70.up_proj", "model.layers.32.mlp.experts.71.up_proj", "model.layers.32.mlp.experts.72.up_proj", "model.layers.32.mlp.experts.73.up_proj", "model.layers.32.mlp.experts.74.up_proj", "model.layers.32.mlp.experts.75.up_proj", "model.layers.32.mlp.experts.76.up_proj", "model.layers.32.mlp.experts.77.up_proj", "model.layers.32.mlp.experts.78.up_proj", "model.layers.32.mlp.experts.79.up_proj", "model.layers.32.mlp.experts.80.up_proj", "model.layers.32.mlp.experts.81.up_proj", "model.layers.32.mlp.experts.82.up_proj", "model.layers.32.mlp.experts.83.up_proj", "model.layers.32.mlp.experts.84.up_proj", "model.layers.32.mlp.experts.85.up_proj", "model.layers.32.mlp.experts.86.up_proj", "model.layers.32.mlp.experts.87.up_proj", "model.layers.32.mlp.experts.88.up_proj", "model.layers.32.mlp.experts.89.up_proj", "model.layers.32.mlp.experts.90.up_proj", "model.layers.32.mlp.experts.91.up_proj", "model.layers.32.mlp.experts.92.up_proj", "model.layers.32.mlp.experts.93.up_proj", "model.layers.32.mlp.experts.94.up_proj", "model.layers.32.mlp.experts.95.up_proj", "model.layers.32.mlp.experts.96.up_proj", "model.layers.32.mlp.experts.97.up_proj", "model.layers.32.mlp.experts.98.up_proj", "model.layers.32.mlp.experts.99.up_proj", "model.layers.32.mlp.experts.100.up_proj", "model.layers.32.mlp.experts.101.up_proj", "model.layers.32.mlp.experts.102.up_proj", "model.layers.32.mlp.experts.103.up_proj", "model.layers.32.mlp.experts.104.up_proj", "model.layers.32.mlp.experts.105.up_proj", "model.layers.32.mlp.experts.106.up_proj", "model.layers.32.mlp.experts.107.up_proj", "model.layers.32.mlp.experts.108.up_proj", "model.layers.32.mlp.experts.109.up_proj", "model.layers.32.mlp.experts.110.up_proj", "model.layers.32.mlp.experts.111.up_proj", "model.layers.32.mlp.experts.112.up_proj", "model.layers.32.mlp.experts.113.up_proj", "model.layers.32.mlp.experts.114.up_proj", "model.layers.32.mlp.experts.115.up_proj", "model.layers.32.mlp.experts.116.up_proj", "model.layers.32.mlp.experts.117.up_proj", "model.layers.32.mlp.experts.118.up_proj", "model.layers.32.mlp.experts.119.up_proj", "model.layers.32.mlp.experts.120.up_proj", "model.layers.32.mlp.experts.121.up_proj", "model.layers.32.mlp.experts.122.up_proj", "model.layers.32.mlp.experts.123.up_proj", "model.layers.32.mlp.experts.124.up_proj", "model.layers.32.mlp.experts.125.up_proj", "model.layers.32.mlp.experts.126.up_proj", "model.layers.32.mlp.experts.127.up_proj", "model.layers.32.mlp.experts.128.up_proj", "model.layers.32.mlp.experts.129.up_proj", "model.layers.32.mlp.experts.130.up_proj", "model.layers.32.mlp.experts.131.up_proj", "model.layers.32.mlp.experts.132.up_proj", "model.layers.32.mlp.experts.133.up_proj", "model.layers.32.mlp.experts.134.up_proj", "model.layers.32.mlp.experts.135.up_proj", "model.layers.32.mlp.experts.136.up_proj", "model.layers.32.mlp.experts.137.up_proj", "model.layers.32.mlp.experts.138.up_proj", "model.layers.32.mlp.experts.139.up_proj", "model.layers.32.mlp.experts.140.up_proj", "model.layers.32.mlp.experts.141.up_proj", "model.layers.32.mlp.experts.142.up_proj", "model.layers.32.mlp.experts.143.up_proj", "model.layers.32.mlp.experts.144.up_proj", "model.layers.32.mlp.experts.145.up_proj", "model.layers.32.mlp.experts.146.up_proj", "model.layers.32.mlp.experts.147.up_proj", "model.layers.32.mlp.experts.148.up_proj", "model.layers.32.mlp.experts.149.up_proj", "model.layers.32.mlp.experts.150.up_proj", "model.layers.32.mlp.experts.151.up_proj", "model.layers.32.mlp.experts.152.up_proj", "model.layers.32.mlp.experts.153.up_proj", "model.layers.32.mlp.experts.154.up_proj", "model.layers.32.mlp.experts.155.up_proj", "model.layers.32.mlp.experts.156.up_proj", "model.layers.32.mlp.experts.157.up_proj", "model.layers.32.mlp.experts.158.up_proj", "model.layers.32.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -5.406634882092372e-05, "dbits": 2516582400 }, { "dkld": -6.945603527128662e-05, "dbits": 5033164800 } ] }, { "idx": 194, "layers": [ "model.layers.32.mlp.experts.0.down_proj", "model.layers.32.mlp.experts.1.down_proj", "model.layers.32.mlp.experts.2.down_proj", "model.layers.32.mlp.experts.3.down_proj", "model.layers.32.mlp.experts.4.down_proj", "model.layers.32.mlp.experts.5.down_proj", "model.layers.32.mlp.experts.6.down_proj", "model.layers.32.mlp.experts.7.down_proj", "model.layers.32.mlp.experts.8.down_proj", "model.layers.32.mlp.experts.9.down_proj", "model.layers.32.mlp.experts.10.down_proj", "model.layers.32.mlp.experts.11.down_proj", "model.layers.32.mlp.experts.12.down_proj", "model.layers.32.mlp.experts.13.down_proj", "model.layers.32.mlp.experts.14.down_proj", "model.layers.32.mlp.experts.15.down_proj", "model.layers.32.mlp.experts.16.down_proj", "model.layers.32.mlp.experts.17.down_proj", "model.layers.32.mlp.experts.18.down_proj", "model.layers.32.mlp.experts.19.down_proj", "model.layers.32.mlp.experts.20.down_proj", "model.layers.32.mlp.experts.21.down_proj", "model.layers.32.mlp.experts.22.down_proj", "model.layers.32.mlp.experts.23.down_proj", "model.layers.32.mlp.experts.24.down_proj", "model.layers.32.mlp.experts.25.down_proj", "model.layers.32.mlp.experts.26.down_proj", "model.layers.32.mlp.experts.27.down_proj", "model.layers.32.mlp.experts.28.down_proj", "model.layers.32.mlp.experts.29.down_proj", "model.layers.32.mlp.experts.30.down_proj", "model.layers.32.mlp.experts.31.down_proj", "model.layers.32.mlp.experts.32.down_proj", "model.layers.32.mlp.experts.33.down_proj", "model.layers.32.mlp.experts.34.down_proj", "model.layers.32.mlp.experts.35.down_proj", "model.layers.32.mlp.experts.36.down_proj", "model.layers.32.mlp.experts.37.down_proj", "model.layers.32.mlp.experts.38.down_proj", "model.layers.32.mlp.experts.39.down_proj", "model.layers.32.mlp.experts.40.down_proj", "model.layers.32.mlp.experts.41.down_proj", "model.layers.32.mlp.experts.42.down_proj", "model.layers.32.mlp.experts.43.down_proj", "model.layers.32.mlp.experts.44.down_proj", "model.layers.32.mlp.experts.45.down_proj", "model.layers.32.mlp.experts.46.down_proj", "model.layers.32.mlp.experts.47.down_proj", "model.layers.32.mlp.experts.48.down_proj", "model.layers.32.mlp.experts.49.down_proj", "model.layers.32.mlp.experts.50.down_proj", "model.layers.32.mlp.experts.51.down_proj", "model.layers.32.mlp.experts.52.down_proj", "model.layers.32.mlp.experts.53.down_proj", "model.layers.32.mlp.experts.54.down_proj", "model.layers.32.mlp.experts.55.down_proj", "model.layers.32.mlp.experts.56.down_proj", "model.layers.32.mlp.experts.57.down_proj", "model.layers.32.mlp.experts.58.down_proj", "model.layers.32.mlp.experts.59.down_proj", "model.layers.32.mlp.experts.60.down_proj", "model.layers.32.mlp.experts.61.down_proj", "model.layers.32.mlp.experts.62.down_proj", "model.layers.32.mlp.experts.63.down_proj", "model.layers.32.mlp.experts.64.down_proj", "model.layers.32.mlp.experts.65.down_proj", "model.layers.32.mlp.experts.66.down_proj", "model.layers.32.mlp.experts.67.down_proj", "model.layers.32.mlp.experts.68.down_proj", "model.layers.32.mlp.experts.69.down_proj", "model.layers.32.mlp.experts.70.down_proj", "model.layers.32.mlp.experts.71.down_proj", "model.layers.32.mlp.experts.72.down_proj", "model.layers.32.mlp.experts.73.down_proj", "model.layers.32.mlp.experts.74.down_proj", "model.layers.32.mlp.experts.75.down_proj", "model.layers.32.mlp.experts.76.down_proj", "model.layers.32.mlp.experts.77.down_proj", "model.layers.32.mlp.experts.78.down_proj", "model.layers.32.mlp.experts.79.down_proj", "model.layers.32.mlp.experts.80.down_proj", "model.layers.32.mlp.experts.81.down_proj", "model.layers.32.mlp.experts.82.down_proj", "model.layers.32.mlp.experts.83.down_proj", "model.layers.32.mlp.experts.84.down_proj", "model.layers.32.mlp.experts.85.down_proj", "model.layers.32.mlp.experts.86.down_proj", "model.layers.32.mlp.experts.87.down_proj", "model.layers.32.mlp.experts.88.down_proj", "model.layers.32.mlp.experts.89.down_proj", "model.layers.32.mlp.experts.90.down_proj", "model.layers.32.mlp.experts.91.down_proj", "model.layers.32.mlp.experts.92.down_proj", "model.layers.32.mlp.experts.93.down_proj", "model.layers.32.mlp.experts.94.down_proj", "model.layers.32.mlp.experts.95.down_proj", "model.layers.32.mlp.experts.96.down_proj", "model.layers.32.mlp.experts.97.down_proj", "model.layers.32.mlp.experts.98.down_proj", "model.layers.32.mlp.experts.99.down_proj", "model.layers.32.mlp.experts.100.down_proj", "model.layers.32.mlp.experts.101.down_proj", "model.layers.32.mlp.experts.102.down_proj", "model.layers.32.mlp.experts.103.down_proj", "model.layers.32.mlp.experts.104.down_proj", "model.layers.32.mlp.experts.105.down_proj", "model.layers.32.mlp.experts.106.down_proj", "model.layers.32.mlp.experts.107.down_proj", "model.layers.32.mlp.experts.108.down_proj", "model.layers.32.mlp.experts.109.down_proj", "model.layers.32.mlp.experts.110.down_proj", "model.layers.32.mlp.experts.111.down_proj", "model.layers.32.mlp.experts.112.down_proj", "model.layers.32.mlp.experts.113.down_proj", "model.layers.32.mlp.experts.114.down_proj", "model.layers.32.mlp.experts.115.down_proj", "model.layers.32.mlp.experts.116.down_proj", "model.layers.32.mlp.experts.117.down_proj", "model.layers.32.mlp.experts.118.down_proj", "model.layers.32.mlp.experts.119.down_proj", "model.layers.32.mlp.experts.120.down_proj", "model.layers.32.mlp.experts.121.down_proj", "model.layers.32.mlp.experts.122.down_proj", "model.layers.32.mlp.experts.123.down_proj", "model.layers.32.mlp.experts.124.down_proj", "model.layers.32.mlp.experts.125.down_proj", "model.layers.32.mlp.experts.126.down_proj", "model.layers.32.mlp.experts.127.down_proj", "model.layers.32.mlp.experts.128.down_proj", "model.layers.32.mlp.experts.129.down_proj", "model.layers.32.mlp.experts.130.down_proj", "model.layers.32.mlp.experts.131.down_proj", "model.layers.32.mlp.experts.132.down_proj", "model.layers.32.mlp.experts.133.down_proj", "model.layers.32.mlp.experts.134.down_proj", "model.layers.32.mlp.experts.135.down_proj", "model.layers.32.mlp.experts.136.down_proj", "model.layers.32.mlp.experts.137.down_proj", "model.layers.32.mlp.experts.138.down_proj", "model.layers.32.mlp.experts.139.down_proj", "model.layers.32.mlp.experts.140.down_proj", "model.layers.32.mlp.experts.141.down_proj", "model.layers.32.mlp.experts.142.down_proj", "model.layers.32.mlp.experts.143.down_proj", "model.layers.32.mlp.experts.144.down_proj", "model.layers.32.mlp.experts.145.down_proj", "model.layers.32.mlp.experts.146.down_proj", "model.layers.32.mlp.experts.147.down_proj", "model.layers.32.mlp.experts.148.down_proj", "model.layers.32.mlp.experts.149.down_proj", "model.layers.32.mlp.experts.150.down_proj", "model.layers.32.mlp.experts.151.down_proj", "model.layers.32.mlp.experts.152.down_proj", "model.layers.32.mlp.experts.153.down_proj", "model.layers.32.mlp.experts.154.down_proj", "model.layers.32.mlp.experts.155.down_proj", "model.layers.32.mlp.experts.156.down_proj", "model.layers.32.mlp.experts.157.down_proj", "model.layers.32.mlp.experts.158.down_proj", "model.layers.32.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.981665845960344e-05, "dbits": 1258291200 }, { "dkld": -4.8068910837173115e-05, "dbits": 2516582400 } ] }, { "idx": 195, "layers": [ "model.layers.33.self_attn.q_proj" ], "candidates": [ { "dkld": 2.3082457482816177e-05, "dbits": 62914560 }, { "dkld": 1.8895976245403637e-05, "dbits": 125829120 } ] }, { "idx": 196, "layers": [ "model.layers.33.self_attn.k_proj", "model.layers.33.self_attn.v_proj" ], "candidates": [ { "dkld": -3.61433019861572e-05, "dbits": 10485760 }, { "dkld": -3.6647357046603116e-05, "dbits": 20971520 } ] }, { "idx": 197, "layers": [ "model.layers.33.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00020599928684532538, "dbits": 62914560 }, { "dkld": -0.000153018906712531, "dbits": 125829120 } ] }, { "idx": 198, "layers": [ "model.layers.33.mlp.shared_experts.gate_proj", "model.layers.33.mlp.shared_experts.up_proj", "model.layers.33.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.0002872178563848131, "dbits": 23592960 }, { "dkld": -0.00019021739717572927, "dbits": 47185920 } ] }, { "idx": 199, "layers": [ "model.layers.33.mlp.experts.0.gate_proj", "model.layers.33.mlp.experts.1.gate_proj", "model.layers.33.mlp.experts.2.gate_proj", "model.layers.33.mlp.experts.3.gate_proj", "model.layers.33.mlp.experts.4.gate_proj", "model.layers.33.mlp.experts.5.gate_proj", "model.layers.33.mlp.experts.6.gate_proj", "model.layers.33.mlp.experts.7.gate_proj", "model.layers.33.mlp.experts.8.gate_proj", "model.layers.33.mlp.experts.9.gate_proj", "model.layers.33.mlp.experts.10.gate_proj", "model.layers.33.mlp.experts.11.gate_proj", "model.layers.33.mlp.experts.12.gate_proj", "model.layers.33.mlp.experts.13.gate_proj", "model.layers.33.mlp.experts.14.gate_proj", "model.layers.33.mlp.experts.15.gate_proj", "model.layers.33.mlp.experts.16.gate_proj", "model.layers.33.mlp.experts.17.gate_proj", "model.layers.33.mlp.experts.18.gate_proj", "model.layers.33.mlp.experts.19.gate_proj", "model.layers.33.mlp.experts.20.gate_proj", "model.layers.33.mlp.experts.21.gate_proj", "model.layers.33.mlp.experts.22.gate_proj", "model.layers.33.mlp.experts.23.gate_proj", "model.layers.33.mlp.experts.24.gate_proj", "model.layers.33.mlp.experts.25.gate_proj", "model.layers.33.mlp.experts.26.gate_proj", "model.layers.33.mlp.experts.27.gate_proj", "model.layers.33.mlp.experts.28.gate_proj", "model.layers.33.mlp.experts.29.gate_proj", "model.layers.33.mlp.experts.30.gate_proj", "model.layers.33.mlp.experts.31.gate_proj", "model.layers.33.mlp.experts.32.gate_proj", "model.layers.33.mlp.experts.33.gate_proj", "model.layers.33.mlp.experts.34.gate_proj", "model.layers.33.mlp.experts.35.gate_proj", "model.layers.33.mlp.experts.36.gate_proj", "model.layers.33.mlp.experts.37.gate_proj", "model.layers.33.mlp.experts.38.gate_proj", "model.layers.33.mlp.experts.39.gate_proj", "model.layers.33.mlp.experts.40.gate_proj", "model.layers.33.mlp.experts.41.gate_proj", "model.layers.33.mlp.experts.42.gate_proj", "model.layers.33.mlp.experts.43.gate_proj", "model.layers.33.mlp.experts.44.gate_proj", "model.layers.33.mlp.experts.45.gate_proj", "model.layers.33.mlp.experts.46.gate_proj", "model.layers.33.mlp.experts.47.gate_proj", "model.layers.33.mlp.experts.48.gate_proj", "model.layers.33.mlp.experts.49.gate_proj", "model.layers.33.mlp.experts.50.gate_proj", "model.layers.33.mlp.experts.51.gate_proj", "model.layers.33.mlp.experts.52.gate_proj", "model.layers.33.mlp.experts.53.gate_proj", "model.layers.33.mlp.experts.54.gate_proj", "model.layers.33.mlp.experts.55.gate_proj", "model.layers.33.mlp.experts.56.gate_proj", "model.layers.33.mlp.experts.57.gate_proj", "model.layers.33.mlp.experts.58.gate_proj", "model.layers.33.mlp.experts.59.gate_proj", "model.layers.33.mlp.experts.60.gate_proj", "model.layers.33.mlp.experts.61.gate_proj", "model.layers.33.mlp.experts.62.gate_proj", "model.layers.33.mlp.experts.63.gate_proj", "model.layers.33.mlp.experts.64.gate_proj", "model.layers.33.mlp.experts.65.gate_proj", "model.layers.33.mlp.experts.66.gate_proj", "model.layers.33.mlp.experts.67.gate_proj", "model.layers.33.mlp.experts.68.gate_proj", "model.layers.33.mlp.experts.69.gate_proj", "model.layers.33.mlp.experts.70.gate_proj", "model.layers.33.mlp.experts.71.gate_proj", "model.layers.33.mlp.experts.72.gate_proj", "model.layers.33.mlp.experts.73.gate_proj", "model.layers.33.mlp.experts.74.gate_proj", "model.layers.33.mlp.experts.75.gate_proj", "model.layers.33.mlp.experts.76.gate_proj", "model.layers.33.mlp.experts.77.gate_proj", "model.layers.33.mlp.experts.78.gate_proj", "model.layers.33.mlp.experts.79.gate_proj", "model.layers.33.mlp.experts.80.gate_proj", "model.layers.33.mlp.experts.81.gate_proj", "model.layers.33.mlp.experts.82.gate_proj", "model.layers.33.mlp.experts.83.gate_proj", "model.layers.33.mlp.experts.84.gate_proj", "model.layers.33.mlp.experts.85.gate_proj", "model.layers.33.mlp.experts.86.gate_proj", "model.layers.33.mlp.experts.87.gate_proj", "model.layers.33.mlp.experts.88.gate_proj", "model.layers.33.mlp.experts.89.gate_proj", "model.layers.33.mlp.experts.90.gate_proj", "model.layers.33.mlp.experts.91.gate_proj", "model.layers.33.mlp.experts.92.gate_proj", "model.layers.33.mlp.experts.93.gate_proj", "model.layers.33.mlp.experts.94.gate_proj", "model.layers.33.mlp.experts.95.gate_proj", "model.layers.33.mlp.experts.96.gate_proj", "model.layers.33.mlp.experts.97.gate_proj", "model.layers.33.mlp.experts.98.gate_proj", "model.layers.33.mlp.experts.99.gate_proj", "model.layers.33.mlp.experts.100.gate_proj", "model.layers.33.mlp.experts.101.gate_proj", "model.layers.33.mlp.experts.102.gate_proj", "model.layers.33.mlp.experts.103.gate_proj", "model.layers.33.mlp.experts.104.gate_proj", "model.layers.33.mlp.experts.105.gate_proj", "model.layers.33.mlp.experts.106.gate_proj", "model.layers.33.mlp.experts.107.gate_proj", "model.layers.33.mlp.experts.108.gate_proj", "model.layers.33.mlp.experts.109.gate_proj", "model.layers.33.mlp.experts.110.gate_proj", "model.layers.33.mlp.experts.111.gate_proj", "model.layers.33.mlp.experts.112.gate_proj", "model.layers.33.mlp.experts.113.gate_proj", "model.layers.33.mlp.experts.114.gate_proj", "model.layers.33.mlp.experts.115.gate_proj", "model.layers.33.mlp.experts.116.gate_proj", "model.layers.33.mlp.experts.117.gate_proj", "model.layers.33.mlp.experts.118.gate_proj", "model.layers.33.mlp.experts.119.gate_proj", "model.layers.33.mlp.experts.120.gate_proj", "model.layers.33.mlp.experts.121.gate_proj", "model.layers.33.mlp.experts.122.gate_proj", "model.layers.33.mlp.experts.123.gate_proj", "model.layers.33.mlp.experts.124.gate_proj", "model.layers.33.mlp.experts.125.gate_proj", "model.layers.33.mlp.experts.126.gate_proj", "model.layers.33.mlp.experts.127.gate_proj", "model.layers.33.mlp.experts.128.gate_proj", "model.layers.33.mlp.experts.129.gate_proj", "model.layers.33.mlp.experts.130.gate_proj", "model.layers.33.mlp.experts.131.gate_proj", "model.layers.33.mlp.experts.132.gate_proj", "model.layers.33.mlp.experts.133.gate_proj", "model.layers.33.mlp.experts.134.gate_proj", "model.layers.33.mlp.experts.135.gate_proj", "model.layers.33.mlp.experts.136.gate_proj", "model.layers.33.mlp.experts.137.gate_proj", "model.layers.33.mlp.experts.138.gate_proj", "model.layers.33.mlp.experts.139.gate_proj", "model.layers.33.mlp.experts.140.gate_proj", "model.layers.33.mlp.experts.141.gate_proj", "model.layers.33.mlp.experts.142.gate_proj", "model.layers.33.mlp.experts.143.gate_proj", "model.layers.33.mlp.experts.144.gate_proj", "model.layers.33.mlp.experts.145.gate_proj", "model.layers.33.mlp.experts.146.gate_proj", "model.layers.33.mlp.experts.147.gate_proj", "model.layers.33.mlp.experts.148.gate_proj", "model.layers.33.mlp.experts.149.gate_proj", "model.layers.33.mlp.experts.150.gate_proj", "model.layers.33.mlp.experts.151.gate_proj", "model.layers.33.mlp.experts.152.gate_proj", "model.layers.33.mlp.experts.153.gate_proj", "model.layers.33.mlp.experts.154.gate_proj", "model.layers.33.mlp.experts.155.gate_proj", "model.layers.33.mlp.experts.156.gate_proj", "model.layers.33.mlp.experts.157.gate_proj", "model.layers.33.mlp.experts.158.gate_proj", "model.layers.33.mlp.experts.159.gate_proj", "model.layers.33.mlp.experts.0.up_proj", "model.layers.33.mlp.experts.1.up_proj", "model.layers.33.mlp.experts.2.up_proj", "model.layers.33.mlp.experts.3.up_proj", "model.layers.33.mlp.experts.4.up_proj", "model.layers.33.mlp.experts.5.up_proj", "model.layers.33.mlp.experts.6.up_proj", "model.layers.33.mlp.experts.7.up_proj", "model.layers.33.mlp.experts.8.up_proj", "model.layers.33.mlp.experts.9.up_proj", "model.layers.33.mlp.experts.10.up_proj", "model.layers.33.mlp.experts.11.up_proj", "model.layers.33.mlp.experts.12.up_proj", "model.layers.33.mlp.experts.13.up_proj", "model.layers.33.mlp.experts.14.up_proj", "model.layers.33.mlp.experts.15.up_proj", "model.layers.33.mlp.experts.16.up_proj", "model.layers.33.mlp.experts.17.up_proj", "model.layers.33.mlp.experts.18.up_proj", "model.layers.33.mlp.experts.19.up_proj", "model.layers.33.mlp.experts.20.up_proj", "model.layers.33.mlp.experts.21.up_proj", "model.layers.33.mlp.experts.22.up_proj", "model.layers.33.mlp.experts.23.up_proj", "model.layers.33.mlp.experts.24.up_proj", "model.layers.33.mlp.experts.25.up_proj", "model.layers.33.mlp.experts.26.up_proj", "model.layers.33.mlp.experts.27.up_proj", "model.layers.33.mlp.experts.28.up_proj", "model.layers.33.mlp.experts.29.up_proj", "model.layers.33.mlp.experts.30.up_proj", "model.layers.33.mlp.experts.31.up_proj", "model.layers.33.mlp.experts.32.up_proj", "model.layers.33.mlp.experts.33.up_proj", "model.layers.33.mlp.experts.34.up_proj", "model.layers.33.mlp.experts.35.up_proj", "model.layers.33.mlp.experts.36.up_proj", "model.layers.33.mlp.experts.37.up_proj", "model.layers.33.mlp.experts.38.up_proj", "model.layers.33.mlp.experts.39.up_proj", "model.layers.33.mlp.experts.40.up_proj", "model.layers.33.mlp.experts.41.up_proj", "model.layers.33.mlp.experts.42.up_proj", "model.layers.33.mlp.experts.43.up_proj", "model.layers.33.mlp.experts.44.up_proj", "model.layers.33.mlp.experts.45.up_proj", "model.layers.33.mlp.experts.46.up_proj", "model.layers.33.mlp.experts.47.up_proj", "model.layers.33.mlp.experts.48.up_proj", "model.layers.33.mlp.experts.49.up_proj", "model.layers.33.mlp.experts.50.up_proj", "model.layers.33.mlp.experts.51.up_proj", "model.layers.33.mlp.experts.52.up_proj", "model.layers.33.mlp.experts.53.up_proj", "model.layers.33.mlp.experts.54.up_proj", "model.layers.33.mlp.experts.55.up_proj", "model.layers.33.mlp.experts.56.up_proj", "model.layers.33.mlp.experts.57.up_proj", "model.layers.33.mlp.experts.58.up_proj", "model.layers.33.mlp.experts.59.up_proj", "model.layers.33.mlp.experts.60.up_proj", "model.layers.33.mlp.experts.61.up_proj", "model.layers.33.mlp.experts.62.up_proj", "model.layers.33.mlp.experts.63.up_proj", "model.layers.33.mlp.experts.64.up_proj", "model.layers.33.mlp.experts.65.up_proj", "model.layers.33.mlp.experts.66.up_proj", "model.layers.33.mlp.experts.67.up_proj", "model.layers.33.mlp.experts.68.up_proj", "model.layers.33.mlp.experts.69.up_proj", "model.layers.33.mlp.experts.70.up_proj", "model.layers.33.mlp.experts.71.up_proj", "model.layers.33.mlp.experts.72.up_proj", "model.layers.33.mlp.experts.73.up_proj", "model.layers.33.mlp.experts.74.up_proj", "model.layers.33.mlp.experts.75.up_proj", "model.layers.33.mlp.experts.76.up_proj", "model.layers.33.mlp.experts.77.up_proj", "model.layers.33.mlp.experts.78.up_proj", "model.layers.33.mlp.experts.79.up_proj", "model.layers.33.mlp.experts.80.up_proj", "model.layers.33.mlp.experts.81.up_proj", "model.layers.33.mlp.experts.82.up_proj", "model.layers.33.mlp.experts.83.up_proj", "model.layers.33.mlp.experts.84.up_proj", "model.layers.33.mlp.experts.85.up_proj", "model.layers.33.mlp.experts.86.up_proj", "model.layers.33.mlp.experts.87.up_proj", "model.layers.33.mlp.experts.88.up_proj", "model.layers.33.mlp.experts.89.up_proj", "model.layers.33.mlp.experts.90.up_proj", "model.layers.33.mlp.experts.91.up_proj", "model.layers.33.mlp.experts.92.up_proj", "model.layers.33.mlp.experts.93.up_proj", "model.layers.33.mlp.experts.94.up_proj", "model.layers.33.mlp.experts.95.up_proj", "model.layers.33.mlp.experts.96.up_proj", "model.layers.33.mlp.experts.97.up_proj", "model.layers.33.mlp.experts.98.up_proj", "model.layers.33.mlp.experts.99.up_proj", "model.layers.33.mlp.experts.100.up_proj", "model.layers.33.mlp.experts.101.up_proj", "model.layers.33.mlp.experts.102.up_proj", "model.layers.33.mlp.experts.103.up_proj", "model.layers.33.mlp.experts.104.up_proj", "model.layers.33.mlp.experts.105.up_proj", "model.layers.33.mlp.experts.106.up_proj", "model.layers.33.mlp.experts.107.up_proj", "model.layers.33.mlp.experts.108.up_proj", "model.layers.33.mlp.experts.109.up_proj", "model.layers.33.mlp.experts.110.up_proj", "model.layers.33.mlp.experts.111.up_proj", "model.layers.33.mlp.experts.112.up_proj", "model.layers.33.mlp.experts.113.up_proj", "model.layers.33.mlp.experts.114.up_proj", "model.layers.33.mlp.experts.115.up_proj", "model.layers.33.mlp.experts.116.up_proj", "model.layers.33.mlp.experts.117.up_proj", "model.layers.33.mlp.experts.118.up_proj", "model.layers.33.mlp.experts.119.up_proj", "model.layers.33.mlp.experts.120.up_proj", "model.layers.33.mlp.experts.121.up_proj", "model.layers.33.mlp.experts.122.up_proj", "model.layers.33.mlp.experts.123.up_proj", "model.layers.33.mlp.experts.124.up_proj", "model.layers.33.mlp.experts.125.up_proj", "model.layers.33.mlp.experts.126.up_proj", "model.layers.33.mlp.experts.127.up_proj", "model.layers.33.mlp.experts.128.up_proj", "model.layers.33.mlp.experts.129.up_proj", "model.layers.33.mlp.experts.130.up_proj", "model.layers.33.mlp.experts.131.up_proj", "model.layers.33.mlp.experts.132.up_proj", "model.layers.33.mlp.experts.133.up_proj", "model.layers.33.mlp.experts.134.up_proj", "model.layers.33.mlp.experts.135.up_proj", "model.layers.33.mlp.experts.136.up_proj", "model.layers.33.mlp.experts.137.up_proj", "model.layers.33.mlp.experts.138.up_proj", "model.layers.33.mlp.experts.139.up_proj", "model.layers.33.mlp.experts.140.up_proj", "model.layers.33.mlp.experts.141.up_proj", "model.layers.33.mlp.experts.142.up_proj", "model.layers.33.mlp.experts.143.up_proj", "model.layers.33.mlp.experts.144.up_proj", "model.layers.33.mlp.experts.145.up_proj", "model.layers.33.mlp.experts.146.up_proj", "model.layers.33.mlp.experts.147.up_proj", "model.layers.33.mlp.experts.148.up_proj", "model.layers.33.mlp.experts.149.up_proj", "model.layers.33.mlp.experts.150.up_proj", "model.layers.33.mlp.experts.151.up_proj", "model.layers.33.mlp.experts.152.up_proj", "model.layers.33.mlp.experts.153.up_proj", "model.layers.33.mlp.experts.154.up_proj", "model.layers.33.mlp.experts.155.up_proj", "model.layers.33.mlp.experts.156.up_proj", "model.layers.33.mlp.experts.157.up_proj", "model.layers.33.mlp.experts.158.up_proj", "model.layers.33.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.983706701546873e-05, "dbits": 2516582400 }, { "dkld": -7.006577216088668e-05, "dbits": 5033164800 } ] }, { "idx": 200, "layers": [ "model.layers.33.mlp.experts.0.down_proj", "model.layers.33.mlp.experts.1.down_proj", "model.layers.33.mlp.experts.2.down_proj", "model.layers.33.mlp.experts.3.down_proj", "model.layers.33.mlp.experts.4.down_proj", "model.layers.33.mlp.experts.5.down_proj", "model.layers.33.mlp.experts.6.down_proj", "model.layers.33.mlp.experts.7.down_proj", "model.layers.33.mlp.experts.8.down_proj", "model.layers.33.mlp.experts.9.down_proj", "model.layers.33.mlp.experts.10.down_proj", "model.layers.33.mlp.experts.11.down_proj", "model.layers.33.mlp.experts.12.down_proj", "model.layers.33.mlp.experts.13.down_proj", "model.layers.33.mlp.experts.14.down_proj", "model.layers.33.mlp.experts.15.down_proj", "model.layers.33.mlp.experts.16.down_proj", "model.layers.33.mlp.experts.17.down_proj", "model.layers.33.mlp.experts.18.down_proj", "model.layers.33.mlp.experts.19.down_proj", "model.layers.33.mlp.experts.20.down_proj", "model.layers.33.mlp.experts.21.down_proj", "model.layers.33.mlp.experts.22.down_proj", "model.layers.33.mlp.experts.23.down_proj", "model.layers.33.mlp.experts.24.down_proj", "model.layers.33.mlp.experts.25.down_proj", "model.layers.33.mlp.experts.26.down_proj", "model.layers.33.mlp.experts.27.down_proj", "model.layers.33.mlp.experts.28.down_proj", "model.layers.33.mlp.experts.29.down_proj", "model.layers.33.mlp.experts.30.down_proj", "model.layers.33.mlp.experts.31.down_proj", "model.layers.33.mlp.experts.32.down_proj", "model.layers.33.mlp.experts.33.down_proj", "model.layers.33.mlp.experts.34.down_proj", "model.layers.33.mlp.experts.35.down_proj", "model.layers.33.mlp.experts.36.down_proj", "model.layers.33.mlp.experts.37.down_proj", "model.layers.33.mlp.experts.38.down_proj", "model.layers.33.mlp.experts.39.down_proj", "model.layers.33.mlp.experts.40.down_proj", "model.layers.33.mlp.experts.41.down_proj", "model.layers.33.mlp.experts.42.down_proj", "model.layers.33.mlp.experts.43.down_proj", "model.layers.33.mlp.experts.44.down_proj", "model.layers.33.mlp.experts.45.down_proj", "model.layers.33.mlp.experts.46.down_proj", "model.layers.33.mlp.experts.47.down_proj", "model.layers.33.mlp.experts.48.down_proj", "model.layers.33.mlp.experts.49.down_proj", "model.layers.33.mlp.experts.50.down_proj", "model.layers.33.mlp.experts.51.down_proj", "model.layers.33.mlp.experts.52.down_proj", "model.layers.33.mlp.experts.53.down_proj", "model.layers.33.mlp.experts.54.down_proj", "model.layers.33.mlp.experts.55.down_proj", "model.layers.33.mlp.experts.56.down_proj", "model.layers.33.mlp.experts.57.down_proj", "model.layers.33.mlp.experts.58.down_proj", "model.layers.33.mlp.experts.59.down_proj", "model.layers.33.mlp.experts.60.down_proj", "model.layers.33.mlp.experts.61.down_proj", "model.layers.33.mlp.experts.62.down_proj", "model.layers.33.mlp.experts.63.down_proj", "model.layers.33.mlp.experts.64.down_proj", "model.layers.33.mlp.experts.65.down_proj", "model.layers.33.mlp.experts.66.down_proj", "model.layers.33.mlp.experts.67.down_proj", "model.layers.33.mlp.experts.68.down_proj", "model.layers.33.mlp.experts.69.down_proj", "model.layers.33.mlp.experts.70.down_proj", "model.layers.33.mlp.experts.71.down_proj", "model.layers.33.mlp.experts.72.down_proj", "model.layers.33.mlp.experts.73.down_proj", "model.layers.33.mlp.experts.74.down_proj", "model.layers.33.mlp.experts.75.down_proj", "model.layers.33.mlp.experts.76.down_proj", "model.layers.33.mlp.experts.77.down_proj", "model.layers.33.mlp.experts.78.down_proj", "model.layers.33.mlp.experts.79.down_proj", "model.layers.33.mlp.experts.80.down_proj", "model.layers.33.mlp.experts.81.down_proj", "model.layers.33.mlp.experts.82.down_proj", "model.layers.33.mlp.experts.83.down_proj", "model.layers.33.mlp.experts.84.down_proj", "model.layers.33.mlp.experts.85.down_proj", "model.layers.33.mlp.experts.86.down_proj", "model.layers.33.mlp.experts.87.down_proj", "model.layers.33.mlp.experts.88.down_proj", "model.layers.33.mlp.experts.89.down_proj", "model.layers.33.mlp.experts.90.down_proj", "model.layers.33.mlp.experts.91.down_proj", "model.layers.33.mlp.experts.92.down_proj", "model.layers.33.mlp.experts.93.down_proj", "model.layers.33.mlp.experts.94.down_proj", "model.layers.33.mlp.experts.95.down_proj", "model.layers.33.mlp.experts.96.down_proj", "model.layers.33.mlp.experts.97.down_proj", "model.layers.33.mlp.experts.98.down_proj", "model.layers.33.mlp.experts.99.down_proj", "model.layers.33.mlp.experts.100.down_proj", "model.layers.33.mlp.experts.101.down_proj", "model.layers.33.mlp.experts.102.down_proj", "model.layers.33.mlp.experts.103.down_proj", "model.layers.33.mlp.experts.104.down_proj", "model.layers.33.mlp.experts.105.down_proj", "model.layers.33.mlp.experts.106.down_proj", "model.layers.33.mlp.experts.107.down_proj", "model.layers.33.mlp.experts.108.down_proj", "model.layers.33.mlp.experts.109.down_proj", "model.layers.33.mlp.experts.110.down_proj", "model.layers.33.mlp.experts.111.down_proj", "model.layers.33.mlp.experts.112.down_proj", "model.layers.33.mlp.experts.113.down_proj", "model.layers.33.mlp.experts.114.down_proj", "model.layers.33.mlp.experts.115.down_proj", "model.layers.33.mlp.experts.116.down_proj", "model.layers.33.mlp.experts.117.down_proj", "model.layers.33.mlp.experts.118.down_proj", "model.layers.33.mlp.experts.119.down_proj", "model.layers.33.mlp.experts.120.down_proj", "model.layers.33.mlp.experts.121.down_proj", "model.layers.33.mlp.experts.122.down_proj", "model.layers.33.mlp.experts.123.down_proj", "model.layers.33.mlp.experts.124.down_proj", "model.layers.33.mlp.experts.125.down_proj", "model.layers.33.mlp.experts.126.down_proj", "model.layers.33.mlp.experts.127.down_proj", "model.layers.33.mlp.experts.128.down_proj", "model.layers.33.mlp.experts.129.down_proj", "model.layers.33.mlp.experts.130.down_proj", "model.layers.33.mlp.experts.131.down_proj", "model.layers.33.mlp.experts.132.down_proj", "model.layers.33.mlp.experts.133.down_proj", "model.layers.33.mlp.experts.134.down_proj", "model.layers.33.mlp.experts.135.down_proj", "model.layers.33.mlp.experts.136.down_proj", "model.layers.33.mlp.experts.137.down_proj", "model.layers.33.mlp.experts.138.down_proj", "model.layers.33.mlp.experts.139.down_proj", "model.layers.33.mlp.experts.140.down_proj", "model.layers.33.mlp.experts.141.down_proj", "model.layers.33.mlp.experts.142.down_proj", "model.layers.33.mlp.experts.143.down_proj", "model.layers.33.mlp.experts.144.down_proj", "model.layers.33.mlp.experts.145.down_proj", "model.layers.33.mlp.experts.146.down_proj", "model.layers.33.mlp.experts.147.down_proj", "model.layers.33.mlp.experts.148.down_proj", "model.layers.33.mlp.experts.149.down_proj", "model.layers.33.mlp.experts.150.down_proj", "model.layers.33.mlp.experts.151.down_proj", "model.layers.33.mlp.experts.152.down_proj", "model.layers.33.mlp.experts.153.down_proj", "model.layers.33.mlp.experts.154.down_proj", "model.layers.33.mlp.experts.155.down_proj", "model.layers.33.mlp.experts.156.down_proj", "model.layers.33.mlp.experts.157.down_proj", "model.layers.33.mlp.experts.158.down_proj", "model.layers.33.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -6.337370723485947e-05, "dbits": 1258291200 }, { "dkld": -5.066234152763943e-05, "dbits": 2516582400 } ] }, { "idx": 201, "layers": [ "model.layers.34.self_attn.q_proj" ], "candidates": [ { "dkld": -9.594142902642419e-05, "dbits": 62914560 }, { "dkld": -8.162332233041525e-05, "dbits": 125829120 } ] }, { "idx": 202, "layers": [ "model.layers.34.self_attn.k_proj", "model.layers.34.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00013263337314128876, "dbits": 10485760 }, { "dkld": -8.548879995941977e-05, "dbits": 20971520 } ] }, { "idx": 203, "layers": [ "model.layers.34.self_attn.o_proj" ], "candidates": [ { "dkld": 9.380190167576109e-05, "dbits": 62914560 }, { "dkld": 8.101230487227509e-05, "dbits": 125829120 } ] }, { "idx": 204, "layers": [ "model.layers.34.mlp.shared_experts.gate_proj", "model.layers.34.mlp.shared_experts.up_proj", "model.layers.34.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.0002229623030871146, "dbits": 23592960 }, { "dkld": -0.0002226835116744038, "dbits": 47185920 } ] }, { "idx": 205, "layers": [ "model.layers.34.mlp.experts.0.gate_proj", "model.layers.34.mlp.experts.1.gate_proj", "model.layers.34.mlp.experts.2.gate_proj", "model.layers.34.mlp.experts.3.gate_proj", "model.layers.34.mlp.experts.4.gate_proj", "model.layers.34.mlp.experts.5.gate_proj", "model.layers.34.mlp.experts.6.gate_proj", "model.layers.34.mlp.experts.7.gate_proj", "model.layers.34.mlp.experts.8.gate_proj", "model.layers.34.mlp.experts.9.gate_proj", "model.layers.34.mlp.experts.10.gate_proj", "model.layers.34.mlp.experts.11.gate_proj", "model.layers.34.mlp.experts.12.gate_proj", "model.layers.34.mlp.experts.13.gate_proj", "model.layers.34.mlp.experts.14.gate_proj", "model.layers.34.mlp.experts.15.gate_proj", "model.layers.34.mlp.experts.16.gate_proj", "model.layers.34.mlp.experts.17.gate_proj", "model.layers.34.mlp.experts.18.gate_proj", "model.layers.34.mlp.experts.19.gate_proj", "model.layers.34.mlp.experts.20.gate_proj", "model.layers.34.mlp.experts.21.gate_proj", "model.layers.34.mlp.experts.22.gate_proj", "model.layers.34.mlp.experts.23.gate_proj", "model.layers.34.mlp.experts.24.gate_proj", "model.layers.34.mlp.experts.25.gate_proj", "model.layers.34.mlp.experts.26.gate_proj", "model.layers.34.mlp.experts.27.gate_proj", "model.layers.34.mlp.experts.28.gate_proj", "model.layers.34.mlp.experts.29.gate_proj", "model.layers.34.mlp.experts.30.gate_proj", "model.layers.34.mlp.experts.31.gate_proj", "model.layers.34.mlp.experts.32.gate_proj", "model.layers.34.mlp.experts.33.gate_proj", "model.layers.34.mlp.experts.34.gate_proj", "model.layers.34.mlp.experts.35.gate_proj", "model.layers.34.mlp.experts.36.gate_proj", "model.layers.34.mlp.experts.37.gate_proj", "model.layers.34.mlp.experts.38.gate_proj", "model.layers.34.mlp.experts.39.gate_proj", "model.layers.34.mlp.experts.40.gate_proj", "model.layers.34.mlp.experts.41.gate_proj", "model.layers.34.mlp.experts.42.gate_proj", "model.layers.34.mlp.experts.43.gate_proj", "model.layers.34.mlp.experts.44.gate_proj", "model.layers.34.mlp.experts.45.gate_proj", "model.layers.34.mlp.experts.46.gate_proj", "model.layers.34.mlp.experts.47.gate_proj", "model.layers.34.mlp.experts.48.gate_proj", "model.layers.34.mlp.experts.49.gate_proj", "model.layers.34.mlp.experts.50.gate_proj", "model.layers.34.mlp.experts.51.gate_proj", "model.layers.34.mlp.experts.52.gate_proj", "model.layers.34.mlp.experts.53.gate_proj", "model.layers.34.mlp.experts.54.gate_proj", "model.layers.34.mlp.experts.55.gate_proj", "model.layers.34.mlp.experts.56.gate_proj", "model.layers.34.mlp.experts.57.gate_proj", "model.layers.34.mlp.experts.58.gate_proj", "model.layers.34.mlp.experts.59.gate_proj", "model.layers.34.mlp.experts.60.gate_proj", "model.layers.34.mlp.experts.61.gate_proj", "model.layers.34.mlp.experts.62.gate_proj", "model.layers.34.mlp.experts.63.gate_proj", "model.layers.34.mlp.experts.64.gate_proj", "model.layers.34.mlp.experts.65.gate_proj", "model.layers.34.mlp.experts.66.gate_proj", "model.layers.34.mlp.experts.67.gate_proj", "model.layers.34.mlp.experts.68.gate_proj", "model.layers.34.mlp.experts.69.gate_proj", "model.layers.34.mlp.experts.70.gate_proj", "model.layers.34.mlp.experts.71.gate_proj", "model.layers.34.mlp.experts.72.gate_proj", "model.layers.34.mlp.experts.73.gate_proj", "model.layers.34.mlp.experts.74.gate_proj", "model.layers.34.mlp.experts.75.gate_proj", "model.layers.34.mlp.experts.76.gate_proj", "model.layers.34.mlp.experts.77.gate_proj", "model.layers.34.mlp.experts.78.gate_proj", "model.layers.34.mlp.experts.79.gate_proj", "model.layers.34.mlp.experts.80.gate_proj", "model.layers.34.mlp.experts.81.gate_proj", "model.layers.34.mlp.experts.82.gate_proj", "model.layers.34.mlp.experts.83.gate_proj", "model.layers.34.mlp.experts.84.gate_proj", "model.layers.34.mlp.experts.85.gate_proj", "model.layers.34.mlp.experts.86.gate_proj", "model.layers.34.mlp.experts.87.gate_proj", "model.layers.34.mlp.experts.88.gate_proj", "model.layers.34.mlp.experts.89.gate_proj", "model.layers.34.mlp.experts.90.gate_proj", "model.layers.34.mlp.experts.91.gate_proj", "model.layers.34.mlp.experts.92.gate_proj", "model.layers.34.mlp.experts.93.gate_proj", "model.layers.34.mlp.experts.94.gate_proj", "model.layers.34.mlp.experts.95.gate_proj", "model.layers.34.mlp.experts.96.gate_proj", "model.layers.34.mlp.experts.97.gate_proj", "model.layers.34.mlp.experts.98.gate_proj", "model.layers.34.mlp.experts.99.gate_proj", "model.layers.34.mlp.experts.100.gate_proj", "model.layers.34.mlp.experts.101.gate_proj", "model.layers.34.mlp.experts.102.gate_proj", "model.layers.34.mlp.experts.103.gate_proj", "model.layers.34.mlp.experts.104.gate_proj", "model.layers.34.mlp.experts.105.gate_proj", "model.layers.34.mlp.experts.106.gate_proj", "model.layers.34.mlp.experts.107.gate_proj", "model.layers.34.mlp.experts.108.gate_proj", "model.layers.34.mlp.experts.109.gate_proj", "model.layers.34.mlp.experts.110.gate_proj", "model.layers.34.mlp.experts.111.gate_proj", "model.layers.34.mlp.experts.112.gate_proj", "model.layers.34.mlp.experts.113.gate_proj", "model.layers.34.mlp.experts.114.gate_proj", "model.layers.34.mlp.experts.115.gate_proj", "model.layers.34.mlp.experts.116.gate_proj", "model.layers.34.mlp.experts.117.gate_proj", "model.layers.34.mlp.experts.118.gate_proj", "model.layers.34.mlp.experts.119.gate_proj", "model.layers.34.mlp.experts.120.gate_proj", "model.layers.34.mlp.experts.121.gate_proj", "model.layers.34.mlp.experts.122.gate_proj", "model.layers.34.mlp.experts.123.gate_proj", "model.layers.34.mlp.experts.124.gate_proj", "model.layers.34.mlp.experts.125.gate_proj", "model.layers.34.mlp.experts.126.gate_proj", "model.layers.34.mlp.experts.127.gate_proj", "model.layers.34.mlp.experts.128.gate_proj", "model.layers.34.mlp.experts.129.gate_proj", "model.layers.34.mlp.experts.130.gate_proj", "model.layers.34.mlp.experts.131.gate_proj", "model.layers.34.mlp.experts.132.gate_proj", "model.layers.34.mlp.experts.133.gate_proj", "model.layers.34.mlp.experts.134.gate_proj", "model.layers.34.mlp.experts.135.gate_proj", "model.layers.34.mlp.experts.136.gate_proj", "model.layers.34.mlp.experts.137.gate_proj", "model.layers.34.mlp.experts.138.gate_proj", "model.layers.34.mlp.experts.139.gate_proj", "model.layers.34.mlp.experts.140.gate_proj", "model.layers.34.mlp.experts.141.gate_proj", "model.layers.34.mlp.experts.142.gate_proj", "model.layers.34.mlp.experts.143.gate_proj", "model.layers.34.mlp.experts.144.gate_proj", "model.layers.34.mlp.experts.145.gate_proj", "model.layers.34.mlp.experts.146.gate_proj", "model.layers.34.mlp.experts.147.gate_proj", "model.layers.34.mlp.experts.148.gate_proj", "model.layers.34.mlp.experts.149.gate_proj", "model.layers.34.mlp.experts.150.gate_proj", "model.layers.34.mlp.experts.151.gate_proj", "model.layers.34.mlp.experts.152.gate_proj", "model.layers.34.mlp.experts.153.gate_proj", "model.layers.34.mlp.experts.154.gate_proj", "model.layers.34.mlp.experts.155.gate_proj", "model.layers.34.mlp.experts.156.gate_proj", "model.layers.34.mlp.experts.157.gate_proj", "model.layers.34.mlp.experts.158.gate_proj", "model.layers.34.mlp.experts.159.gate_proj", "model.layers.34.mlp.experts.0.up_proj", "model.layers.34.mlp.experts.1.up_proj", "model.layers.34.mlp.experts.2.up_proj", "model.layers.34.mlp.experts.3.up_proj", "model.layers.34.mlp.experts.4.up_proj", "model.layers.34.mlp.experts.5.up_proj", "model.layers.34.mlp.experts.6.up_proj", "model.layers.34.mlp.experts.7.up_proj", "model.layers.34.mlp.experts.8.up_proj", "model.layers.34.mlp.experts.9.up_proj", "model.layers.34.mlp.experts.10.up_proj", "model.layers.34.mlp.experts.11.up_proj", "model.layers.34.mlp.experts.12.up_proj", "model.layers.34.mlp.experts.13.up_proj", "model.layers.34.mlp.experts.14.up_proj", "model.layers.34.mlp.experts.15.up_proj", "model.layers.34.mlp.experts.16.up_proj", "model.layers.34.mlp.experts.17.up_proj", "model.layers.34.mlp.experts.18.up_proj", "model.layers.34.mlp.experts.19.up_proj", "model.layers.34.mlp.experts.20.up_proj", "model.layers.34.mlp.experts.21.up_proj", "model.layers.34.mlp.experts.22.up_proj", "model.layers.34.mlp.experts.23.up_proj", "model.layers.34.mlp.experts.24.up_proj", "model.layers.34.mlp.experts.25.up_proj", "model.layers.34.mlp.experts.26.up_proj", "model.layers.34.mlp.experts.27.up_proj", "model.layers.34.mlp.experts.28.up_proj", "model.layers.34.mlp.experts.29.up_proj", "model.layers.34.mlp.experts.30.up_proj", "model.layers.34.mlp.experts.31.up_proj", "model.layers.34.mlp.experts.32.up_proj", "model.layers.34.mlp.experts.33.up_proj", "model.layers.34.mlp.experts.34.up_proj", "model.layers.34.mlp.experts.35.up_proj", "model.layers.34.mlp.experts.36.up_proj", "model.layers.34.mlp.experts.37.up_proj", "model.layers.34.mlp.experts.38.up_proj", "model.layers.34.mlp.experts.39.up_proj", "model.layers.34.mlp.experts.40.up_proj", "model.layers.34.mlp.experts.41.up_proj", "model.layers.34.mlp.experts.42.up_proj", "model.layers.34.mlp.experts.43.up_proj", "model.layers.34.mlp.experts.44.up_proj", "model.layers.34.mlp.experts.45.up_proj", "model.layers.34.mlp.experts.46.up_proj", "model.layers.34.mlp.experts.47.up_proj", "model.layers.34.mlp.experts.48.up_proj", "model.layers.34.mlp.experts.49.up_proj", "model.layers.34.mlp.experts.50.up_proj", "model.layers.34.mlp.experts.51.up_proj", "model.layers.34.mlp.experts.52.up_proj", "model.layers.34.mlp.experts.53.up_proj", "model.layers.34.mlp.experts.54.up_proj", "model.layers.34.mlp.experts.55.up_proj", "model.layers.34.mlp.experts.56.up_proj", "model.layers.34.mlp.experts.57.up_proj", "model.layers.34.mlp.experts.58.up_proj", "model.layers.34.mlp.experts.59.up_proj", "model.layers.34.mlp.experts.60.up_proj", "model.layers.34.mlp.experts.61.up_proj", "model.layers.34.mlp.experts.62.up_proj", "model.layers.34.mlp.experts.63.up_proj", "model.layers.34.mlp.experts.64.up_proj", "model.layers.34.mlp.experts.65.up_proj", "model.layers.34.mlp.experts.66.up_proj", "model.layers.34.mlp.experts.67.up_proj", "model.layers.34.mlp.experts.68.up_proj", "model.layers.34.mlp.experts.69.up_proj", "model.layers.34.mlp.experts.70.up_proj", "model.layers.34.mlp.experts.71.up_proj", "model.layers.34.mlp.experts.72.up_proj", "model.layers.34.mlp.experts.73.up_proj", "model.layers.34.mlp.experts.74.up_proj", "model.layers.34.mlp.experts.75.up_proj", "model.layers.34.mlp.experts.76.up_proj", "model.layers.34.mlp.experts.77.up_proj", "model.layers.34.mlp.experts.78.up_proj", "model.layers.34.mlp.experts.79.up_proj", "model.layers.34.mlp.experts.80.up_proj", "model.layers.34.mlp.experts.81.up_proj", "model.layers.34.mlp.experts.82.up_proj", "model.layers.34.mlp.experts.83.up_proj", "model.layers.34.mlp.experts.84.up_proj", "model.layers.34.mlp.experts.85.up_proj", "model.layers.34.mlp.experts.86.up_proj", "model.layers.34.mlp.experts.87.up_proj", "model.layers.34.mlp.experts.88.up_proj", "model.layers.34.mlp.experts.89.up_proj", "model.layers.34.mlp.experts.90.up_proj", "model.layers.34.mlp.experts.91.up_proj", "model.layers.34.mlp.experts.92.up_proj", "model.layers.34.mlp.experts.93.up_proj", "model.layers.34.mlp.experts.94.up_proj", "model.layers.34.mlp.experts.95.up_proj", "model.layers.34.mlp.experts.96.up_proj", "model.layers.34.mlp.experts.97.up_proj", "model.layers.34.mlp.experts.98.up_proj", "model.layers.34.mlp.experts.99.up_proj", "model.layers.34.mlp.experts.100.up_proj", "model.layers.34.mlp.experts.101.up_proj", "model.layers.34.mlp.experts.102.up_proj", "model.layers.34.mlp.experts.103.up_proj", "model.layers.34.mlp.experts.104.up_proj", "model.layers.34.mlp.experts.105.up_proj", "model.layers.34.mlp.experts.106.up_proj", "model.layers.34.mlp.experts.107.up_proj", "model.layers.34.mlp.experts.108.up_proj", "model.layers.34.mlp.experts.109.up_proj", "model.layers.34.mlp.experts.110.up_proj", "model.layers.34.mlp.experts.111.up_proj", "model.layers.34.mlp.experts.112.up_proj", "model.layers.34.mlp.experts.113.up_proj", "model.layers.34.mlp.experts.114.up_proj", "model.layers.34.mlp.experts.115.up_proj", "model.layers.34.mlp.experts.116.up_proj", "model.layers.34.mlp.experts.117.up_proj", "model.layers.34.mlp.experts.118.up_proj", "model.layers.34.mlp.experts.119.up_proj", "model.layers.34.mlp.experts.120.up_proj", "model.layers.34.mlp.experts.121.up_proj", "model.layers.34.mlp.experts.122.up_proj", "model.layers.34.mlp.experts.123.up_proj", "model.layers.34.mlp.experts.124.up_proj", "model.layers.34.mlp.experts.125.up_proj", "model.layers.34.mlp.experts.126.up_proj", "model.layers.34.mlp.experts.127.up_proj", "model.layers.34.mlp.experts.128.up_proj", "model.layers.34.mlp.experts.129.up_proj", "model.layers.34.mlp.experts.130.up_proj", "model.layers.34.mlp.experts.131.up_proj", "model.layers.34.mlp.experts.132.up_proj", "model.layers.34.mlp.experts.133.up_proj", "model.layers.34.mlp.experts.134.up_proj", "model.layers.34.mlp.experts.135.up_proj", "model.layers.34.mlp.experts.136.up_proj", "model.layers.34.mlp.experts.137.up_proj", "model.layers.34.mlp.experts.138.up_proj", "model.layers.34.mlp.experts.139.up_proj", "model.layers.34.mlp.experts.140.up_proj", "model.layers.34.mlp.experts.141.up_proj", "model.layers.34.mlp.experts.142.up_proj", "model.layers.34.mlp.experts.143.up_proj", "model.layers.34.mlp.experts.144.up_proj", "model.layers.34.mlp.experts.145.up_proj", "model.layers.34.mlp.experts.146.up_proj", "model.layers.34.mlp.experts.147.up_proj", "model.layers.34.mlp.experts.148.up_proj", "model.layers.34.mlp.experts.149.up_proj", "model.layers.34.mlp.experts.150.up_proj", "model.layers.34.mlp.experts.151.up_proj", "model.layers.34.mlp.experts.152.up_proj", "model.layers.34.mlp.experts.153.up_proj", "model.layers.34.mlp.experts.154.up_proj", "model.layers.34.mlp.experts.155.up_proj", "model.layers.34.mlp.experts.156.up_proj", "model.layers.34.mlp.experts.157.up_proj", "model.layers.34.mlp.experts.158.up_proj", "model.layers.34.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.311792578548054e-05, "dbits": 2516582400 }, { "dkld": -5.236098077148095e-05, "dbits": 5033164800 } ] }, { "idx": 206, "layers": [ "model.layers.34.mlp.experts.0.down_proj", "model.layers.34.mlp.experts.1.down_proj", "model.layers.34.mlp.experts.2.down_proj", "model.layers.34.mlp.experts.3.down_proj", "model.layers.34.mlp.experts.4.down_proj", "model.layers.34.mlp.experts.5.down_proj", "model.layers.34.mlp.experts.6.down_proj", "model.layers.34.mlp.experts.7.down_proj", "model.layers.34.mlp.experts.8.down_proj", "model.layers.34.mlp.experts.9.down_proj", "model.layers.34.mlp.experts.10.down_proj", "model.layers.34.mlp.experts.11.down_proj", "model.layers.34.mlp.experts.12.down_proj", "model.layers.34.mlp.experts.13.down_proj", "model.layers.34.mlp.experts.14.down_proj", "model.layers.34.mlp.experts.15.down_proj", "model.layers.34.mlp.experts.16.down_proj", "model.layers.34.mlp.experts.17.down_proj", "model.layers.34.mlp.experts.18.down_proj", "model.layers.34.mlp.experts.19.down_proj", "model.layers.34.mlp.experts.20.down_proj", "model.layers.34.mlp.experts.21.down_proj", "model.layers.34.mlp.experts.22.down_proj", "model.layers.34.mlp.experts.23.down_proj", "model.layers.34.mlp.experts.24.down_proj", "model.layers.34.mlp.experts.25.down_proj", "model.layers.34.mlp.experts.26.down_proj", "model.layers.34.mlp.experts.27.down_proj", "model.layers.34.mlp.experts.28.down_proj", "model.layers.34.mlp.experts.29.down_proj", "model.layers.34.mlp.experts.30.down_proj", "model.layers.34.mlp.experts.31.down_proj", "model.layers.34.mlp.experts.32.down_proj", "model.layers.34.mlp.experts.33.down_proj", "model.layers.34.mlp.experts.34.down_proj", "model.layers.34.mlp.experts.35.down_proj", "model.layers.34.mlp.experts.36.down_proj", "model.layers.34.mlp.experts.37.down_proj", "model.layers.34.mlp.experts.38.down_proj", "model.layers.34.mlp.experts.39.down_proj", "model.layers.34.mlp.experts.40.down_proj", "model.layers.34.mlp.experts.41.down_proj", "model.layers.34.mlp.experts.42.down_proj", "model.layers.34.mlp.experts.43.down_proj", "model.layers.34.mlp.experts.44.down_proj", "model.layers.34.mlp.experts.45.down_proj", "model.layers.34.mlp.experts.46.down_proj", "model.layers.34.mlp.experts.47.down_proj", "model.layers.34.mlp.experts.48.down_proj", "model.layers.34.mlp.experts.49.down_proj", "model.layers.34.mlp.experts.50.down_proj", "model.layers.34.mlp.experts.51.down_proj", "model.layers.34.mlp.experts.52.down_proj", "model.layers.34.mlp.experts.53.down_proj", "model.layers.34.mlp.experts.54.down_proj", "model.layers.34.mlp.experts.55.down_proj", "model.layers.34.mlp.experts.56.down_proj", "model.layers.34.mlp.experts.57.down_proj", "model.layers.34.mlp.experts.58.down_proj", "model.layers.34.mlp.experts.59.down_proj", "model.layers.34.mlp.experts.60.down_proj", "model.layers.34.mlp.experts.61.down_proj", "model.layers.34.mlp.experts.62.down_proj", "model.layers.34.mlp.experts.63.down_proj", "model.layers.34.mlp.experts.64.down_proj", "model.layers.34.mlp.experts.65.down_proj", "model.layers.34.mlp.experts.66.down_proj", "model.layers.34.mlp.experts.67.down_proj", "model.layers.34.mlp.experts.68.down_proj", "model.layers.34.mlp.experts.69.down_proj", "model.layers.34.mlp.experts.70.down_proj", "model.layers.34.mlp.experts.71.down_proj", "model.layers.34.mlp.experts.72.down_proj", "model.layers.34.mlp.experts.73.down_proj", "model.layers.34.mlp.experts.74.down_proj", "model.layers.34.mlp.experts.75.down_proj", "model.layers.34.mlp.experts.76.down_proj", "model.layers.34.mlp.experts.77.down_proj", "model.layers.34.mlp.experts.78.down_proj", "model.layers.34.mlp.experts.79.down_proj", "model.layers.34.mlp.experts.80.down_proj", "model.layers.34.mlp.experts.81.down_proj", "model.layers.34.mlp.experts.82.down_proj", "model.layers.34.mlp.experts.83.down_proj", "model.layers.34.mlp.experts.84.down_proj", "model.layers.34.mlp.experts.85.down_proj", "model.layers.34.mlp.experts.86.down_proj", "model.layers.34.mlp.experts.87.down_proj", "model.layers.34.mlp.experts.88.down_proj", "model.layers.34.mlp.experts.89.down_proj", "model.layers.34.mlp.experts.90.down_proj", "model.layers.34.mlp.experts.91.down_proj", "model.layers.34.mlp.experts.92.down_proj", "model.layers.34.mlp.experts.93.down_proj", "model.layers.34.mlp.experts.94.down_proj", "model.layers.34.mlp.experts.95.down_proj", "model.layers.34.mlp.experts.96.down_proj", "model.layers.34.mlp.experts.97.down_proj", "model.layers.34.mlp.experts.98.down_proj", "model.layers.34.mlp.experts.99.down_proj", "model.layers.34.mlp.experts.100.down_proj", "model.layers.34.mlp.experts.101.down_proj", "model.layers.34.mlp.experts.102.down_proj", "model.layers.34.mlp.experts.103.down_proj", "model.layers.34.mlp.experts.104.down_proj", "model.layers.34.mlp.experts.105.down_proj", "model.layers.34.mlp.experts.106.down_proj", "model.layers.34.mlp.experts.107.down_proj", "model.layers.34.mlp.experts.108.down_proj", "model.layers.34.mlp.experts.109.down_proj", "model.layers.34.mlp.experts.110.down_proj", "model.layers.34.mlp.experts.111.down_proj", "model.layers.34.mlp.experts.112.down_proj", "model.layers.34.mlp.experts.113.down_proj", "model.layers.34.mlp.experts.114.down_proj", "model.layers.34.mlp.experts.115.down_proj", "model.layers.34.mlp.experts.116.down_proj", "model.layers.34.mlp.experts.117.down_proj", "model.layers.34.mlp.experts.118.down_proj", "model.layers.34.mlp.experts.119.down_proj", "model.layers.34.mlp.experts.120.down_proj", "model.layers.34.mlp.experts.121.down_proj", "model.layers.34.mlp.experts.122.down_proj", "model.layers.34.mlp.experts.123.down_proj", "model.layers.34.mlp.experts.124.down_proj", "model.layers.34.mlp.experts.125.down_proj", "model.layers.34.mlp.experts.126.down_proj", "model.layers.34.mlp.experts.127.down_proj", "model.layers.34.mlp.experts.128.down_proj", "model.layers.34.mlp.experts.129.down_proj", "model.layers.34.mlp.experts.130.down_proj", "model.layers.34.mlp.experts.131.down_proj", "model.layers.34.mlp.experts.132.down_proj", "model.layers.34.mlp.experts.133.down_proj", "model.layers.34.mlp.experts.134.down_proj", "model.layers.34.mlp.experts.135.down_proj", "model.layers.34.mlp.experts.136.down_proj", "model.layers.34.mlp.experts.137.down_proj", "model.layers.34.mlp.experts.138.down_proj", "model.layers.34.mlp.experts.139.down_proj", "model.layers.34.mlp.experts.140.down_proj", "model.layers.34.mlp.experts.141.down_proj", "model.layers.34.mlp.experts.142.down_proj", "model.layers.34.mlp.experts.143.down_proj", "model.layers.34.mlp.experts.144.down_proj", "model.layers.34.mlp.experts.145.down_proj", "model.layers.34.mlp.experts.146.down_proj", "model.layers.34.mlp.experts.147.down_proj", "model.layers.34.mlp.experts.148.down_proj", "model.layers.34.mlp.experts.149.down_proj", "model.layers.34.mlp.experts.150.down_proj", "model.layers.34.mlp.experts.151.down_proj", "model.layers.34.mlp.experts.152.down_proj", "model.layers.34.mlp.experts.153.down_proj", "model.layers.34.mlp.experts.154.down_proj", "model.layers.34.mlp.experts.155.down_proj", "model.layers.34.mlp.experts.156.down_proj", "model.layers.34.mlp.experts.157.down_proj", "model.layers.34.mlp.experts.158.down_proj", "model.layers.34.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.670030273496966e-05, "dbits": 1258291200 }, { "dkld": -4.819794557988505e-05, "dbits": 2516582400 } ] }, { "idx": 207, "layers": [ "model.layers.35.self_attn.q_proj" ], "candidates": [ { "dkld": -6.740386597812141e-05, "dbits": 62914560 }, { "dkld": -3.6030937917529496e-05, "dbits": 125829120 } ] }, { "idx": 208, "layers": [ "model.layers.35.self_attn.k_proj", "model.layers.35.self_attn.v_proj" ], "candidates": [ { "dkld": 0.0001825776649639014, "dbits": 10485760 }, { "dkld": 0.00017659799195826088, "dbits": 20971520 } ] }, { "idx": 209, "layers": [ "model.layers.35.self_attn.o_proj" ], "candidates": [ { "dkld": -0.0001803238876163949, "dbits": 62914560 }, { "dkld": -0.00016560130752622977, "dbits": 125829120 } ] }, { "idx": 210, "layers": [ "model.layers.35.mlp.shared_experts.gate_proj", "model.layers.35.mlp.shared_experts.up_proj", "model.layers.35.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00011053984053432941, "dbits": 23592960 }, { "dkld": -3.5602180287240895e-05, "dbits": 47185920 } ] }, { "idx": 211, "layers": [ "model.layers.35.mlp.experts.0.gate_proj", "model.layers.35.mlp.experts.1.gate_proj", "model.layers.35.mlp.experts.2.gate_proj", "model.layers.35.mlp.experts.3.gate_proj", "model.layers.35.mlp.experts.4.gate_proj", "model.layers.35.mlp.experts.5.gate_proj", "model.layers.35.mlp.experts.6.gate_proj", "model.layers.35.mlp.experts.7.gate_proj", "model.layers.35.mlp.experts.8.gate_proj", "model.layers.35.mlp.experts.9.gate_proj", "model.layers.35.mlp.experts.10.gate_proj", "model.layers.35.mlp.experts.11.gate_proj", "model.layers.35.mlp.experts.12.gate_proj", "model.layers.35.mlp.experts.13.gate_proj", "model.layers.35.mlp.experts.14.gate_proj", "model.layers.35.mlp.experts.15.gate_proj", "model.layers.35.mlp.experts.16.gate_proj", "model.layers.35.mlp.experts.17.gate_proj", "model.layers.35.mlp.experts.18.gate_proj", "model.layers.35.mlp.experts.19.gate_proj", "model.layers.35.mlp.experts.20.gate_proj", "model.layers.35.mlp.experts.21.gate_proj", "model.layers.35.mlp.experts.22.gate_proj", "model.layers.35.mlp.experts.23.gate_proj", "model.layers.35.mlp.experts.24.gate_proj", "model.layers.35.mlp.experts.25.gate_proj", "model.layers.35.mlp.experts.26.gate_proj", "model.layers.35.mlp.experts.27.gate_proj", "model.layers.35.mlp.experts.28.gate_proj", "model.layers.35.mlp.experts.29.gate_proj", "model.layers.35.mlp.experts.30.gate_proj", "model.layers.35.mlp.experts.31.gate_proj", "model.layers.35.mlp.experts.32.gate_proj", "model.layers.35.mlp.experts.33.gate_proj", "model.layers.35.mlp.experts.34.gate_proj", "model.layers.35.mlp.experts.35.gate_proj", "model.layers.35.mlp.experts.36.gate_proj", "model.layers.35.mlp.experts.37.gate_proj", "model.layers.35.mlp.experts.38.gate_proj", "model.layers.35.mlp.experts.39.gate_proj", "model.layers.35.mlp.experts.40.gate_proj", "model.layers.35.mlp.experts.41.gate_proj", "model.layers.35.mlp.experts.42.gate_proj", "model.layers.35.mlp.experts.43.gate_proj", "model.layers.35.mlp.experts.44.gate_proj", "model.layers.35.mlp.experts.45.gate_proj", "model.layers.35.mlp.experts.46.gate_proj", "model.layers.35.mlp.experts.47.gate_proj", "model.layers.35.mlp.experts.48.gate_proj", "model.layers.35.mlp.experts.49.gate_proj", "model.layers.35.mlp.experts.50.gate_proj", "model.layers.35.mlp.experts.51.gate_proj", "model.layers.35.mlp.experts.52.gate_proj", "model.layers.35.mlp.experts.53.gate_proj", "model.layers.35.mlp.experts.54.gate_proj", "model.layers.35.mlp.experts.55.gate_proj", "model.layers.35.mlp.experts.56.gate_proj", "model.layers.35.mlp.experts.57.gate_proj", "model.layers.35.mlp.experts.58.gate_proj", "model.layers.35.mlp.experts.59.gate_proj", "model.layers.35.mlp.experts.60.gate_proj", "model.layers.35.mlp.experts.61.gate_proj", "model.layers.35.mlp.experts.62.gate_proj", "model.layers.35.mlp.experts.63.gate_proj", "model.layers.35.mlp.experts.64.gate_proj", "model.layers.35.mlp.experts.65.gate_proj", "model.layers.35.mlp.experts.66.gate_proj", "model.layers.35.mlp.experts.67.gate_proj", "model.layers.35.mlp.experts.68.gate_proj", "model.layers.35.mlp.experts.69.gate_proj", "model.layers.35.mlp.experts.70.gate_proj", "model.layers.35.mlp.experts.71.gate_proj", "model.layers.35.mlp.experts.72.gate_proj", "model.layers.35.mlp.experts.73.gate_proj", "model.layers.35.mlp.experts.74.gate_proj", "model.layers.35.mlp.experts.75.gate_proj", "model.layers.35.mlp.experts.76.gate_proj", "model.layers.35.mlp.experts.77.gate_proj", "model.layers.35.mlp.experts.78.gate_proj", "model.layers.35.mlp.experts.79.gate_proj", "model.layers.35.mlp.experts.80.gate_proj", "model.layers.35.mlp.experts.81.gate_proj", "model.layers.35.mlp.experts.82.gate_proj", "model.layers.35.mlp.experts.83.gate_proj", "model.layers.35.mlp.experts.84.gate_proj", "model.layers.35.mlp.experts.85.gate_proj", "model.layers.35.mlp.experts.86.gate_proj", "model.layers.35.mlp.experts.87.gate_proj", "model.layers.35.mlp.experts.88.gate_proj", "model.layers.35.mlp.experts.89.gate_proj", "model.layers.35.mlp.experts.90.gate_proj", "model.layers.35.mlp.experts.91.gate_proj", "model.layers.35.mlp.experts.92.gate_proj", "model.layers.35.mlp.experts.93.gate_proj", "model.layers.35.mlp.experts.94.gate_proj", "model.layers.35.mlp.experts.95.gate_proj", "model.layers.35.mlp.experts.96.gate_proj", "model.layers.35.mlp.experts.97.gate_proj", "model.layers.35.mlp.experts.98.gate_proj", "model.layers.35.mlp.experts.99.gate_proj", "model.layers.35.mlp.experts.100.gate_proj", "model.layers.35.mlp.experts.101.gate_proj", "model.layers.35.mlp.experts.102.gate_proj", "model.layers.35.mlp.experts.103.gate_proj", "model.layers.35.mlp.experts.104.gate_proj", "model.layers.35.mlp.experts.105.gate_proj", "model.layers.35.mlp.experts.106.gate_proj", "model.layers.35.mlp.experts.107.gate_proj", "model.layers.35.mlp.experts.108.gate_proj", "model.layers.35.mlp.experts.109.gate_proj", "model.layers.35.mlp.experts.110.gate_proj", "model.layers.35.mlp.experts.111.gate_proj", "model.layers.35.mlp.experts.112.gate_proj", "model.layers.35.mlp.experts.113.gate_proj", "model.layers.35.mlp.experts.114.gate_proj", "model.layers.35.mlp.experts.115.gate_proj", "model.layers.35.mlp.experts.116.gate_proj", "model.layers.35.mlp.experts.117.gate_proj", "model.layers.35.mlp.experts.118.gate_proj", "model.layers.35.mlp.experts.119.gate_proj", "model.layers.35.mlp.experts.120.gate_proj", "model.layers.35.mlp.experts.121.gate_proj", "model.layers.35.mlp.experts.122.gate_proj", "model.layers.35.mlp.experts.123.gate_proj", "model.layers.35.mlp.experts.124.gate_proj", "model.layers.35.mlp.experts.125.gate_proj", "model.layers.35.mlp.experts.126.gate_proj", "model.layers.35.mlp.experts.127.gate_proj", "model.layers.35.mlp.experts.128.gate_proj", "model.layers.35.mlp.experts.129.gate_proj", "model.layers.35.mlp.experts.130.gate_proj", "model.layers.35.mlp.experts.131.gate_proj", "model.layers.35.mlp.experts.132.gate_proj", "model.layers.35.mlp.experts.133.gate_proj", "model.layers.35.mlp.experts.134.gate_proj", "model.layers.35.mlp.experts.135.gate_proj", "model.layers.35.mlp.experts.136.gate_proj", "model.layers.35.mlp.experts.137.gate_proj", "model.layers.35.mlp.experts.138.gate_proj", "model.layers.35.mlp.experts.139.gate_proj", "model.layers.35.mlp.experts.140.gate_proj", "model.layers.35.mlp.experts.141.gate_proj", "model.layers.35.mlp.experts.142.gate_proj", "model.layers.35.mlp.experts.143.gate_proj", "model.layers.35.mlp.experts.144.gate_proj", "model.layers.35.mlp.experts.145.gate_proj", "model.layers.35.mlp.experts.146.gate_proj", "model.layers.35.mlp.experts.147.gate_proj", "model.layers.35.mlp.experts.148.gate_proj", "model.layers.35.mlp.experts.149.gate_proj", "model.layers.35.mlp.experts.150.gate_proj", "model.layers.35.mlp.experts.151.gate_proj", "model.layers.35.mlp.experts.152.gate_proj", "model.layers.35.mlp.experts.153.gate_proj", "model.layers.35.mlp.experts.154.gate_proj", "model.layers.35.mlp.experts.155.gate_proj", "model.layers.35.mlp.experts.156.gate_proj", "model.layers.35.mlp.experts.157.gate_proj", "model.layers.35.mlp.experts.158.gate_proj", "model.layers.35.mlp.experts.159.gate_proj", "model.layers.35.mlp.experts.0.up_proj", "model.layers.35.mlp.experts.1.up_proj", "model.layers.35.mlp.experts.2.up_proj", "model.layers.35.mlp.experts.3.up_proj", "model.layers.35.mlp.experts.4.up_proj", "model.layers.35.mlp.experts.5.up_proj", "model.layers.35.mlp.experts.6.up_proj", "model.layers.35.mlp.experts.7.up_proj", "model.layers.35.mlp.experts.8.up_proj", "model.layers.35.mlp.experts.9.up_proj", "model.layers.35.mlp.experts.10.up_proj", "model.layers.35.mlp.experts.11.up_proj", "model.layers.35.mlp.experts.12.up_proj", "model.layers.35.mlp.experts.13.up_proj", "model.layers.35.mlp.experts.14.up_proj", "model.layers.35.mlp.experts.15.up_proj", "model.layers.35.mlp.experts.16.up_proj", "model.layers.35.mlp.experts.17.up_proj", "model.layers.35.mlp.experts.18.up_proj", "model.layers.35.mlp.experts.19.up_proj", "model.layers.35.mlp.experts.20.up_proj", "model.layers.35.mlp.experts.21.up_proj", "model.layers.35.mlp.experts.22.up_proj", "model.layers.35.mlp.experts.23.up_proj", "model.layers.35.mlp.experts.24.up_proj", "model.layers.35.mlp.experts.25.up_proj", "model.layers.35.mlp.experts.26.up_proj", "model.layers.35.mlp.experts.27.up_proj", "model.layers.35.mlp.experts.28.up_proj", "model.layers.35.mlp.experts.29.up_proj", "model.layers.35.mlp.experts.30.up_proj", "model.layers.35.mlp.experts.31.up_proj", "model.layers.35.mlp.experts.32.up_proj", "model.layers.35.mlp.experts.33.up_proj", "model.layers.35.mlp.experts.34.up_proj", "model.layers.35.mlp.experts.35.up_proj", "model.layers.35.mlp.experts.36.up_proj", "model.layers.35.mlp.experts.37.up_proj", "model.layers.35.mlp.experts.38.up_proj", "model.layers.35.mlp.experts.39.up_proj", "model.layers.35.mlp.experts.40.up_proj", "model.layers.35.mlp.experts.41.up_proj", "model.layers.35.mlp.experts.42.up_proj", "model.layers.35.mlp.experts.43.up_proj", "model.layers.35.mlp.experts.44.up_proj", "model.layers.35.mlp.experts.45.up_proj", "model.layers.35.mlp.experts.46.up_proj", "model.layers.35.mlp.experts.47.up_proj", "model.layers.35.mlp.experts.48.up_proj", "model.layers.35.mlp.experts.49.up_proj", "model.layers.35.mlp.experts.50.up_proj", "model.layers.35.mlp.experts.51.up_proj", "model.layers.35.mlp.experts.52.up_proj", "model.layers.35.mlp.experts.53.up_proj", "model.layers.35.mlp.experts.54.up_proj", "model.layers.35.mlp.experts.55.up_proj", "model.layers.35.mlp.experts.56.up_proj", "model.layers.35.mlp.experts.57.up_proj", "model.layers.35.mlp.experts.58.up_proj", "model.layers.35.mlp.experts.59.up_proj", "model.layers.35.mlp.experts.60.up_proj", "model.layers.35.mlp.experts.61.up_proj", "model.layers.35.mlp.experts.62.up_proj", "model.layers.35.mlp.experts.63.up_proj", "model.layers.35.mlp.experts.64.up_proj", "model.layers.35.mlp.experts.65.up_proj", "model.layers.35.mlp.experts.66.up_proj", "model.layers.35.mlp.experts.67.up_proj", "model.layers.35.mlp.experts.68.up_proj", "model.layers.35.mlp.experts.69.up_proj", "model.layers.35.mlp.experts.70.up_proj", "model.layers.35.mlp.experts.71.up_proj", "model.layers.35.mlp.experts.72.up_proj", "model.layers.35.mlp.experts.73.up_proj", "model.layers.35.mlp.experts.74.up_proj", "model.layers.35.mlp.experts.75.up_proj", "model.layers.35.mlp.experts.76.up_proj", "model.layers.35.mlp.experts.77.up_proj", "model.layers.35.mlp.experts.78.up_proj", "model.layers.35.mlp.experts.79.up_proj", "model.layers.35.mlp.experts.80.up_proj", "model.layers.35.mlp.experts.81.up_proj", "model.layers.35.mlp.experts.82.up_proj", "model.layers.35.mlp.experts.83.up_proj", "model.layers.35.mlp.experts.84.up_proj", "model.layers.35.mlp.experts.85.up_proj", "model.layers.35.mlp.experts.86.up_proj", "model.layers.35.mlp.experts.87.up_proj", "model.layers.35.mlp.experts.88.up_proj", "model.layers.35.mlp.experts.89.up_proj", "model.layers.35.mlp.experts.90.up_proj", "model.layers.35.mlp.experts.91.up_proj", "model.layers.35.mlp.experts.92.up_proj", "model.layers.35.mlp.experts.93.up_proj", "model.layers.35.mlp.experts.94.up_proj", "model.layers.35.mlp.experts.95.up_proj", "model.layers.35.mlp.experts.96.up_proj", "model.layers.35.mlp.experts.97.up_proj", "model.layers.35.mlp.experts.98.up_proj", "model.layers.35.mlp.experts.99.up_proj", "model.layers.35.mlp.experts.100.up_proj", "model.layers.35.mlp.experts.101.up_proj", "model.layers.35.mlp.experts.102.up_proj", "model.layers.35.mlp.experts.103.up_proj", "model.layers.35.mlp.experts.104.up_proj", "model.layers.35.mlp.experts.105.up_proj", "model.layers.35.mlp.experts.106.up_proj", "model.layers.35.mlp.experts.107.up_proj", "model.layers.35.mlp.experts.108.up_proj", "model.layers.35.mlp.experts.109.up_proj", "model.layers.35.mlp.experts.110.up_proj", "model.layers.35.mlp.experts.111.up_proj", "model.layers.35.mlp.experts.112.up_proj", "model.layers.35.mlp.experts.113.up_proj", "model.layers.35.mlp.experts.114.up_proj", "model.layers.35.mlp.experts.115.up_proj", "model.layers.35.mlp.experts.116.up_proj", "model.layers.35.mlp.experts.117.up_proj", "model.layers.35.mlp.experts.118.up_proj", "model.layers.35.mlp.experts.119.up_proj", "model.layers.35.mlp.experts.120.up_proj", "model.layers.35.mlp.experts.121.up_proj", "model.layers.35.mlp.experts.122.up_proj", "model.layers.35.mlp.experts.123.up_proj", "model.layers.35.mlp.experts.124.up_proj", "model.layers.35.mlp.experts.125.up_proj", "model.layers.35.mlp.experts.126.up_proj", "model.layers.35.mlp.experts.127.up_proj", "model.layers.35.mlp.experts.128.up_proj", "model.layers.35.mlp.experts.129.up_proj", "model.layers.35.mlp.experts.130.up_proj", "model.layers.35.mlp.experts.131.up_proj", "model.layers.35.mlp.experts.132.up_proj", "model.layers.35.mlp.experts.133.up_proj", "model.layers.35.mlp.experts.134.up_proj", "model.layers.35.mlp.experts.135.up_proj", "model.layers.35.mlp.experts.136.up_proj", "model.layers.35.mlp.experts.137.up_proj", "model.layers.35.mlp.experts.138.up_proj", "model.layers.35.mlp.experts.139.up_proj", "model.layers.35.mlp.experts.140.up_proj", "model.layers.35.mlp.experts.141.up_proj", "model.layers.35.mlp.experts.142.up_proj", "model.layers.35.mlp.experts.143.up_proj", "model.layers.35.mlp.experts.144.up_proj", "model.layers.35.mlp.experts.145.up_proj", "model.layers.35.mlp.experts.146.up_proj", "model.layers.35.mlp.experts.147.up_proj", "model.layers.35.mlp.experts.148.up_proj", "model.layers.35.mlp.experts.149.up_proj", "model.layers.35.mlp.experts.150.up_proj", "model.layers.35.mlp.experts.151.up_proj", "model.layers.35.mlp.experts.152.up_proj", "model.layers.35.mlp.experts.153.up_proj", "model.layers.35.mlp.experts.154.up_proj", "model.layers.35.mlp.experts.155.up_proj", "model.layers.35.mlp.experts.156.up_proj", "model.layers.35.mlp.experts.157.up_proj", "model.layers.35.mlp.experts.158.up_proj", "model.layers.35.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.976368509232963e-05, "dbits": 2516582400 }, { "dkld": -9.78159485384815e-05, "dbits": 5033164800 } ] }, { "idx": 212, "layers": [ "model.layers.35.mlp.experts.0.down_proj", "model.layers.35.mlp.experts.1.down_proj", "model.layers.35.mlp.experts.2.down_proj", "model.layers.35.mlp.experts.3.down_proj", "model.layers.35.mlp.experts.4.down_proj", "model.layers.35.mlp.experts.5.down_proj", "model.layers.35.mlp.experts.6.down_proj", "model.layers.35.mlp.experts.7.down_proj", "model.layers.35.mlp.experts.8.down_proj", "model.layers.35.mlp.experts.9.down_proj", "model.layers.35.mlp.experts.10.down_proj", "model.layers.35.mlp.experts.11.down_proj", "model.layers.35.mlp.experts.12.down_proj", "model.layers.35.mlp.experts.13.down_proj", "model.layers.35.mlp.experts.14.down_proj", "model.layers.35.mlp.experts.15.down_proj", "model.layers.35.mlp.experts.16.down_proj", "model.layers.35.mlp.experts.17.down_proj", "model.layers.35.mlp.experts.18.down_proj", "model.layers.35.mlp.experts.19.down_proj", "model.layers.35.mlp.experts.20.down_proj", "model.layers.35.mlp.experts.21.down_proj", "model.layers.35.mlp.experts.22.down_proj", "model.layers.35.mlp.experts.23.down_proj", "model.layers.35.mlp.experts.24.down_proj", "model.layers.35.mlp.experts.25.down_proj", "model.layers.35.mlp.experts.26.down_proj", "model.layers.35.mlp.experts.27.down_proj", "model.layers.35.mlp.experts.28.down_proj", "model.layers.35.mlp.experts.29.down_proj", "model.layers.35.mlp.experts.30.down_proj", "model.layers.35.mlp.experts.31.down_proj", "model.layers.35.mlp.experts.32.down_proj", "model.layers.35.mlp.experts.33.down_proj", "model.layers.35.mlp.experts.34.down_proj", "model.layers.35.mlp.experts.35.down_proj", "model.layers.35.mlp.experts.36.down_proj", "model.layers.35.mlp.experts.37.down_proj", "model.layers.35.mlp.experts.38.down_proj", "model.layers.35.mlp.experts.39.down_proj", "model.layers.35.mlp.experts.40.down_proj", "model.layers.35.mlp.experts.41.down_proj", "model.layers.35.mlp.experts.42.down_proj", "model.layers.35.mlp.experts.43.down_proj", "model.layers.35.mlp.experts.44.down_proj", "model.layers.35.mlp.experts.45.down_proj", "model.layers.35.mlp.experts.46.down_proj", "model.layers.35.mlp.experts.47.down_proj", "model.layers.35.mlp.experts.48.down_proj", "model.layers.35.mlp.experts.49.down_proj", "model.layers.35.mlp.experts.50.down_proj", "model.layers.35.mlp.experts.51.down_proj", "model.layers.35.mlp.experts.52.down_proj", "model.layers.35.mlp.experts.53.down_proj", "model.layers.35.mlp.experts.54.down_proj", "model.layers.35.mlp.experts.55.down_proj", "model.layers.35.mlp.experts.56.down_proj", "model.layers.35.mlp.experts.57.down_proj", "model.layers.35.mlp.experts.58.down_proj", "model.layers.35.mlp.experts.59.down_proj", "model.layers.35.mlp.experts.60.down_proj", "model.layers.35.mlp.experts.61.down_proj", "model.layers.35.mlp.experts.62.down_proj", "model.layers.35.mlp.experts.63.down_proj", "model.layers.35.mlp.experts.64.down_proj", "model.layers.35.mlp.experts.65.down_proj", "model.layers.35.mlp.experts.66.down_proj", "model.layers.35.mlp.experts.67.down_proj", "model.layers.35.mlp.experts.68.down_proj", "model.layers.35.mlp.experts.69.down_proj", "model.layers.35.mlp.experts.70.down_proj", "model.layers.35.mlp.experts.71.down_proj", "model.layers.35.mlp.experts.72.down_proj", "model.layers.35.mlp.experts.73.down_proj", "model.layers.35.mlp.experts.74.down_proj", "model.layers.35.mlp.experts.75.down_proj", "model.layers.35.mlp.experts.76.down_proj", "model.layers.35.mlp.experts.77.down_proj", "model.layers.35.mlp.experts.78.down_proj", "model.layers.35.mlp.experts.79.down_proj", "model.layers.35.mlp.experts.80.down_proj", "model.layers.35.mlp.experts.81.down_proj", "model.layers.35.mlp.experts.82.down_proj", "model.layers.35.mlp.experts.83.down_proj", "model.layers.35.mlp.experts.84.down_proj", "model.layers.35.mlp.experts.85.down_proj", "model.layers.35.mlp.experts.86.down_proj", "model.layers.35.mlp.experts.87.down_proj", "model.layers.35.mlp.experts.88.down_proj", "model.layers.35.mlp.experts.89.down_proj", "model.layers.35.mlp.experts.90.down_proj", "model.layers.35.mlp.experts.91.down_proj", "model.layers.35.mlp.experts.92.down_proj", "model.layers.35.mlp.experts.93.down_proj", "model.layers.35.mlp.experts.94.down_proj", "model.layers.35.mlp.experts.95.down_proj", "model.layers.35.mlp.experts.96.down_proj", "model.layers.35.mlp.experts.97.down_proj", "model.layers.35.mlp.experts.98.down_proj", "model.layers.35.mlp.experts.99.down_proj", "model.layers.35.mlp.experts.100.down_proj", "model.layers.35.mlp.experts.101.down_proj", "model.layers.35.mlp.experts.102.down_proj", "model.layers.35.mlp.experts.103.down_proj", "model.layers.35.mlp.experts.104.down_proj", "model.layers.35.mlp.experts.105.down_proj", "model.layers.35.mlp.experts.106.down_proj", "model.layers.35.mlp.experts.107.down_proj", "model.layers.35.mlp.experts.108.down_proj", "model.layers.35.mlp.experts.109.down_proj", "model.layers.35.mlp.experts.110.down_proj", "model.layers.35.mlp.experts.111.down_proj", "model.layers.35.mlp.experts.112.down_proj", "model.layers.35.mlp.experts.113.down_proj", "model.layers.35.mlp.experts.114.down_proj", "model.layers.35.mlp.experts.115.down_proj", "model.layers.35.mlp.experts.116.down_proj", "model.layers.35.mlp.experts.117.down_proj", "model.layers.35.mlp.experts.118.down_proj", "model.layers.35.mlp.experts.119.down_proj", "model.layers.35.mlp.experts.120.down_proj", "model.layers.35.mlp.experts.121.down_proj", "model.layers.35.mlp.experts.122.down_proj", "model.layers.35.mlp.experts.123.down_proj", "model.layers.35.mlp.experts.124.down_proj", "model.layers.35.mlp.experts.125.down_proj", "model.layers.35.mlp.experts.126.down_proj", "model.layers.35.mlp.experts.127.down_proj", "model.layers.35.mlp.experts.128.down_proj", "model.layers.35.mlp.experts.129.down_proj", "model.layers.35.mlp.experts.130.down_proj", "model.layers.35.mlp.experts.131.down_proj", "model.layers.35.mlp.experts.132.down_proj", "model.layers.35.mlp.experts.133.down_proj", "model.layers.35.mlp.experts.134.down_proj", "model.layers.35.mlp.experts.135.down_proj", "model.layers.35.mlp.experts.136.down_proj", "model.layers.35.mlp.experts.137.down_proj", "model.layers.35.mlp.experts.138.down_proj", "model.layers.35.mlp.experts.139.down_proj", "model.layers.35.mlp.experts.140.down_proj", "model.layers.35.mlp.experts.141.down_proj", "model.layers.35.mlp.experts.142.down_proj", "model.layers.35.mlp.experts.143.down_proj", "model.layers.35.mlp.experts.144.down_proj", "model.layers.35.mlp.experts.145.down_proj", "model.layers.35.mlp.experts.146.down_proj", "model.layers.35.mlp.experts.147.down_proj", "model.layers.35.mlp.experts.148.down_proj", "model.layers.35.mlp.experts.149.down_proj", "model.layers.35.mlp.experts.150.down_proj", "model.layers.35.mlp.experts.151.down_proj", "model.layers.35.mlp.experts.152.down_proj", "model.layers.35.mlp.experts.153.down_proj", "model.layers.35.mlp.experts.154.down_proj", "model.layers.35.mlp.experts.155.down_proj", "model.layers.35.mlp.experts.156.down_proj", "model.layers.35.mlp.experts.157.down_proj", "model.layers.35.mlp.experts.158.down_proj", "model.layers.35.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.4096849635242375e-05, "dbits": 1258291200 }, { "dkld": -4.0004635229705376e-05, "dbits": 2516582400 } ] }, { "idx": 213, "layers": [ "model.layers.36.self_attn.q_proj" ], "candidates": [ { "dkld": -7.257098332043993e-07, "dbits": 62914560 }, { "dkld": -0.00013303135056048562, "dbits": 125829120 } ] }, { "idx": 214, "layers": [ "model.layers.36.self_attn.k_proj", "model.layers.36.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0006006648531183597, "dbits": 10485760 }, { "dkld": -0.0005469539668411013, "dbits": 20971520 } ] }, { "idx": 215, "layers": [ "model.layers.36.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00011804299429058959, "dbits": 62914560 }, { "dkld": -0.0001192359020933502, "dbits": 125829120 } ] }, { "idx": 216, "layers": [ "model.layers.36.mlp.shared_experts.gate_proj", "model.layers.36.mlp.shared_experts.up_proj", "model.layers.36.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 5.553117953240906e-05, "dbits": 23592960 }, { "dkld": 1.2895883992315726e-05, "dbits": 47185920 } ] }, { "idx": 217, "layers": [ "model.layers.36.mlp.experts.0.gate_proj", "model.layers.36.mlp.experts.1.gate_proj", "model.layers.36.mlp.experts.2.gate_proj", "model.layers.36.mlp.experts.3.gate_proj", "model.layers.36.mlp.experts.4.gate_proj", "model.layers.36.mlp.experts.5.gate_proj", "model.layers.36.mlp.experts.6.gate_proj", "model.layers.36.mlp.experts.7.gate_proj", "model.layers.36.mlp.experts.8.gate_proj", "model.layers.36.mlp.experts.9.gate_proj", "model.layers.36.mlp.experts.10.gate_proj", "model.layers.36.mlp.experts.11.gate_proj", "model.layers.36.mlp.experts.12.gate_proj", "model.layers.36.mlp.experts.13.gate_proj", "model.layers.36.mlp.experts.14.gate_proj", "model.layers.36.mlp.experts.15.gate_proj", "model.layers.36.mlp.experts.16.gate_proj", "model.layers.36.mlp.experts.17.gate_proj", "model.layers.36.mlp.experts.18.gate_proj", "model.layers.36.mlp.experts.19.gate_proj", "model.layers.36.mlp.experts.20.gate_proj", "model.layers.36.mlp.experts.21.gate_proj", "model.layers.36.mlp.experts.22.gate_proj", "model.layers.36.mlp.experts.23.gate_proj", "model.layers.36.mlp.experts.24.gate_proj", "model.layers.36.mlp.experts.25.gate_proj", "model.layers.36.mlp.experts.26.gate_proj", "model.layers.36.mlp.experts.27.gate_proj", "model.layers.36.mlp.experts.28.gate_proj", "model.layers.36.mlp.experts.29.gate_proj", "model.layers.36.mlp.experts.30.gate_proj", "model.layers.36.mlp.experts.31.gate_proj", "model.layers.36.mlp.experts.32.gate_proj", "model.layers.36.mlp.experts.33.gate_proj", "model.layers.36.mlp.experts.34.gate_proj", "model.layers.36.mlp.experts.35.gate_proj", "model.layers.36.mlp.experts.36.gate_proj", "model.layers.36.mlp.experts.37.gate_proj", "model.layers.36.mlp.experts.38.gate_proj", "model.layers.36.mlp.experts.39.gate_proj", "model.layers.36.mlp.experts.40.gate_proj", "model.layers.36.mlp.experts.41.gate_proj", "model.layers.36.mlp.experts.42.gate_proj", "model.layers.36.mlp.experts.43.gate_proj", "model.layers.36.mlp.experts.44.gate_proj", "model.layers.36.mlp.experts.45.gate_proj", "model.layers.36.mlp.experts.46.gate_proj", "model.layers.36.mlp.experts.47.gate_proj", "model.layers.36.mlp.experts.48.gate_proj", "model.layers.36.mlp.experts.49.gate_proj", "model.layers.36.mlp.experts.50.gate_proj", "model.layers.36.mlp.experts.51.gate_proj", "model.layers.36.mlp.experts.52.gate_proj", "model.layers.36.mlp.experts.53.gate_proj", "model.layers.36.mlp.experts.54.gate_proj", "model.layers.36.mlp.experts.55.gate_proj", "model.layers.36.mlp.experts.56.gate_proj", "model.layers.36.mlp.experts.57.gate_proj", "model.layers.36.mlp.experts.58.gate_proj", "model.layers.36.mlp.experts.59.gate_proj", "model.layers.36.mlp.experts.60.gate_proj", "model.layers.36.mlp.experts.61.gate_proj", "model.layers.36.mlp.experts.62.gate_proj", "model.layers.36.mlp.experts.63.gate_proj", "model.layers.36.mlp.experts.64.gate_proj", "model.layers.36.mlp.experts.65.gate_proj", "model.layers.36.mlp.experts.66.gate_proj", "model.layers.36.mlp.experts.67.gate_proj", "model.layers.36.mlp.experts.68.gate_proj", "model.layers.36.mlp.experts.69.gate_proj", "model.layers.36.mlp.experts.70.gate_proj", "model.layers.36.mlp.experts.71.gate_proj", "model.layers.36.mlp.experts.72.gate_proj", "model.layers.36.mlp.experts.73.gate_proj", "model.layers.36.mlp.experts.74.gate_proj", "model.layers.36.mlp.experts.75.gate_proj", "model.layers.36.mlp.experts.76.gate_proj", "model.layers.36.mlp.experts.77.gate_proj", "model.layers.36.mlp.experts.78.gate_proj", "model.layers.36.mlp.experts.79.gate_proj", "model.layers.36.mlp.experts.80.gate_proj", "model.layers.36.mlp.experts.81.gate_proj", "model.layers.36.mlp.experts.82.gate_proj", "model.layers.36.mlp.experts.83.gate_proj", "model.layers.36.mlp.experts.84.gate_proj", "model.layers.36.mlp.experts.85.gate_proj", "model.layers.36.mlp.experts.86.gate_proj", "model.layers.36.mlp.experts.87.gate_proj", "model.layers.36.mlp.experts.88.gate_proj", "model.layers.36.mlp.experts.89.gate_proj", "model.layers.36.mlp.experts.90.gate_proj", "model.layers.36.mlp.experts.91.gate_proj", "model.layers.36.mlp.experts.92.gate_proj", "model.layers.36.mlp.experts.93.gate_proj", "model.layers.36.mlp.experts.94.gate_proj", "model.layers.36.mlp.experts.95.gate_proj", "model.layers.36.mlp.experts.96.gate_proj", "model.layers.36.mlp.experts.97.gate_proj", "model.layers.36.mlp.experts.98.gate_proj", "model.layers.36.mlp.experts.99.gate_proj", "model.layers.36.mlp.experts.100.gate_proj", "model.layers.36.mlp.experts.101.gate_proj", "model.layers.36.mlp.experts.102.gate_proj", "model.layers.36.mlp.experts.103.gate_proj", "model.layers.36.mlp.experts.104.gate_proj", "model.layers.36.mlp.experts.105.gate_proj", "model.layers.36.mlp.experts.106.gate_proj", "model.layers.36.mlp.experts.107.gate_proj", "model.layers.36.mlp.experts.108.gate_proj", "model.layers.36.mlp.experts.109.gate_proj", "model.layers.36.mlp.experts.110.gate_proj", "model.layers.36.mlp.experts.111.gate_proj", "model.layers.36.mlp.experts.112.gate_proj", "model.layers.36.mlp.experts.113.gate_proj", "model.layers.36.mlp.experts.114.gate_proj", "model.layers.36.mlp.experts.115.gate_proj", "model.layers.36.mlp.experts.116.gate_proj", "model.layers.36.mlp.experts.117.gate_proj", "model.layers.36.mlp.experts.118.gate_proj", "model.layers.36.mlp.experts.119.gate_proj", "model.layers.36.mlp.experts.120.gate_proj", "model.layers.36.mlp.experts.121.gate_proj", "model.layers.36.mlp.experts.122.gate_proj", "model.layers.36.mlp.experts.123.gate_proj", "model.layers.36.mlp.experts.124.gate_proj", "model.layers.36.mlp.experts.125.gate_proj", "model.layers.36.mlp.experts.126.gate_proj", "model.layers.36.mlp.experts.127.gate_proj", "model.layers.36.mlp.experts.128.gate_proj", "model.layers.36.mlp.experts.129.gate_proj", "model.layers.36.mlp.experts.130.gate_proj", "model.layers.36.mlp.experts.131.gate_proj", "model.layers.36.mlp.experts.132.gate_proj", "model.layers.36.mlp.experts.133.gate_proj", "model.layers.36.mlp.experts.134.gate_proj", "model.layers.36.mlp.experts.135.gate_proj", "model.layers.36.mlp.experts.136.gate_proj", "model.layers.36.mlp.experts.137.gate_proj", "model.layers.36.mlp.experts.138.gate_proj", "model.layers.36.mlp.experts.139.gate_proj", "model.layers.36.mlp.experts.140.gate_proj", "model.layers.36.mlp.experts.141.gate_proj", "model.layers.36.mlp.experts.142.gate_proj", "model.layers.36.mlp.experts.143.gate_proj", "model.layers.36.mlp.experts.144.gate_proj", "model.layers.36.mlp.experts.145.gate_proj", "model.layers.36.mlp.experts.146.gate_proj", "model.layers.36.mlp.experts.147.gate_proj", "model.layers.36.mlp.experts.148.gate_proj", "model.layers.36.mlp.experts.149.gate_proj", "model.layers.36.mlp.experts.150.gate_proj", "model.layers.36.mlp.experts.151.gate_proj", "model.layers.36.mlp.experts.152.gate_proj", "model.layers.36.mlp.experts.153.gate_proj", "model.layers.36.mlp.experts.154.gate_proj", "model.layers.36.mlp.experts.155.gate_proj", "model.layers.36.mlp.experts.156.gate_proj", "model.layers.36.mlp.experts.157.gate_proj", "model.layers.36.mlp.experts.158.gate_proj", "model.layers.36.mlp.experts.159.gate_proj", "model.layers.36.mlp.experts.0.up_proj", "model.layers.36.mlp.experts.1.up_proj", "model.layers.36.mlp.experts.2.up_proj", "model.layers.36.mlp.experts.3.up_proj", "model.layers.36.mlp.experts.4.up_proj", "model.layers.36.mlp.experts.5.up_proj", "model.layers.36.mlp.experts.6.up_proj", "model.layers.36.mlp.experts.7.up_proj", "model.layers.36.mlp.experts.8.up_proj", "model.layers.36.mlp.experts.9.up_proj", "model.layers.36.mlp.experts.10.up_proj", "model.layers.36.mlp.experts.11.up_proj", "model.layers.36.mlp.experts.12.up_proj", "model.layers.36.mlp.experts.13.up_proj", "model.layers.36.mlp.experts.14.up_proj", "model.layers.36.mlp.experts.15.up_proj", "model.layers.36.mlp.experts.16.up_proj", "model.layers.36.mlp.experts.17.up_proj", "model.layers.36.mlp.experts.18.up_proj", "model.layers.36.mlp.experts.19.up_proj", "model.layers.36.mlp.experts.20.up_proj", "model.layers.36.mlp.experts.21.up_proj", "model.layers.36.mlp.experts.22.up_proj", "model.layers.36.mlp.experts.23.up_proj", "model.layers.36.mlp.experts.24.up_proj", "model.layers.36.mlp.experts.25.up_proj", "model.layers.36.mlp.experts.26.up_proj", "model.layers.36.mlp.experts.27.up_proj", "model.layers.36.mlp.experts.28.up_proj", "model.layers.36.mlp.experts.29.up_proj", "model.layers.36.mlp.experts.30.up_proj", "model.layers.36.mlp.experts.31.up_proj", "model.layers.36.mlp.experts.32.up_proj", "model.layers.36.mlp.experts.33.up_proj", "model.layers.36.mlp.experts.34.up_proj", "model.layers.36.mlp.experts.35.up_proj", "model.layers.36.mlp.experts.36.up_proj", "model.layers.36.mlp.experts.37.up_proj", "model.layers.36.mlp.experts.38.up_proj", "model.layers.36.mlp.experts.39.up_proj", "model.layers.36.mlp.experts.40.up_proj", "model.layers.36.mlp.experts.41.up_proj", "model.layers.36.mlp.experts.42.up_proj", "model.layers.36.mlp.experts.43.up_proj", "model.layers.36.mlp.experts.44.up_proj", "model.layers.36.mlp.experts.45.up_proj", "model.layers.36.mlp.experts.46.up_proj", "model.layers.36.mlp.experts.47.up_proj", "model.layers.36.mlp.experts.48.up_proj", "model.layers.36.mlp.experts.49.up_proj", "model.layers.36.mlp.experts.50.up_proj", "model.layers.36.mlp.experts.51.up_proj", "model.layers.36.mlp.experts.52.up_proj", "model.layers.36.mlp.experts.53.up_proj", "model.layers.36.mlp.experts.54.up_proj", "model.layers.36.mlp.experts.55.up_proj", "model.layers.36.mlp.experts.56.up_proj", "model.layers.36.mlp.experts.57.up_proj", "model.layers.36.mlp.experts.58.up_proj", "model.layers.36.mlp.experts.59.up_proj", "model.layers.36.mlp.experts.60.up_proj", "model.layers.36.mlp.experts.61.up_proj", "model.layers.36.mlp.experts.62.up_proj", "model.layers.36.mlp.experts.63.up_proj", "model.layers.36.mlp.experts.64.up_proj", "model.layers.36.mlp.experts.65.up_proj", "model.layers.36.mlp.experts.66.up_proj", "model.layers.36.mlp.experts.67.up_proj", "model.layers.36.mlp.experts.68.up_proj", "model.layers.36.mlp.experts.69.up_proj", "model.layers.36.mlp.experts.70.up_proj", "model.layers.36.mlp.experts.71.up_proj", "model.layers.36.mlp.experts.72.up_proj", "model.layers.36.mlp.experts.73.up_proj", "model.layers.36.mlp.experts.74.up_proj", "model.layers.36.mlp.experts.75.up_proj", "model.layers.36.mlp.experts.76.up_proj", "model.layers.36.mlp.experts.77.up_proj", "model.layers.36.mlp.experts.78.up_proj", "model.layers.36.mlp.experts.79.up_proj", "model.layers.36.mlp.experts.80.up_proj", "model.layers.36.mlp.experts.81.up_proj", "model.layers.36.mlp.experts.82.up_proj", "model.layers.36.mlp.experts.83.up_proj", "model.layers.36.mlp.experts.84.up_proj", "model.layers.36.mlp.experts.85.up_proj", "model.layers.36.mlp.experts.86.up_proj", "model.layers.36.mlp.experts.87.up_proj", "model.layers.36.mlp.experts.88.up_proj", "model.layers.36.mlp.experts.89.up_proj", "model.layers.36.mlp.experts.90.up_proj", "model.layers.36.mlp.experts.91.up_proj", "model.layers.36.mlp.experts.92.up_proj", "model.layers.36.mlp.experts.93.up_proj", "model.layers.36.mlp.experts.94.up_proj", "model.layers.36.mlp.experts.95.up_proj", "model.layers.36.mlp.experts.96.up_proj", "model.layers.36.mlp.experts.97.up_proj", "model.layers.36.mlp.experts.98.up_proj", "model.layers.36.mlp.experts.99.up_proj", "model.layers.36.mlp.experts.100.up_proj", "model.layers.36.mlp.experts.101.up_proj", "model.layers.36.mlp.experts.102.up_proj", "model.layers.36.mlp.experts.103.up_proj", "model.layers.36.mlp.experts.104.up_proj", "model.layers.36.mlp.experts.105.up_proj", "model.layers.36.mlp.experts.106.up_proj", "model.layers.36.mlp.experts.107.up_proj", "model.layers.36.mlp.experts.108.up_proj", "model.layers.36.mlp.experts.109.up_proj", "model.layers.36.mlp.experts.110.up_proj", "model.layers.36.mlp.experts.111.up_proj", "model.layers.36.mlp.experts.112.up_proj", "model.layers.36.mlp.experts.113.up_proj", "model.layers.36.mlp.experts.114.up_proj", "model.layers.36.mlp.experts.115.up_proj", "model.layers.36.mlp.experts.116.up_proj", "model.layers.36.mlp.experts.117.up_proj", "model.layers.36.mlp.experts.118.up_proj", "model.layers.36.mlp.experts.119.up_proj", "model.layers.36.mlp.experts.120.up_proj", "model.layers.36.mlp.experts.121.up_proj", "model.layers.36.mlp.experts.122.up_proj", "model.layers.36.mlp.experts.123.up_proj", "model.layers.36.mlp.experts.124.up_proj", "model.layers.36.mlp.experts.125.up_proj", "model.layers.36.mlp.experts.126.up_proj", "model.layers.36.mlp.experts.127.up_proj", "model.layers.36.mlp.experts.128.up_proj", "model.layers.36.mlp.experts.129.up_proj", "model.layers.36.mlp.experts.130.up_proj", "model.layers.36.mlp.experts.131.up_proj", "model.layers.36.mlp.experts.132.up_proj", "model.layers.36.mlp.experts.133.up_proj", "model.layers.36.mlp.experts.134.up_proj", "model.layers.36.mlp.experts.135.up_proj", "model.layers.36.mlp.experts.136.up_proj", "model.layers.36.mlp.experts.137.up_proj", "model.layers.36.mlp.experts.138.up_proj", "model.layers.36.mlp.experts.139.up_proj", "model.layers.36.mlp.experts.140.up_proj", "model.layers.36.mlp.experts.141.up_proj", "model.layers.36.mlp.experts.142.up_proj", "model.layers.36.mlp.experts.143.up_proj", "model.layers.36.mlp.experts.144.up_proj", "model.layers.36.mlp.experts.145.up_proj", "model.layers.36.mlp.experts.146.up_proj", "model.layers.36.mlp.experts.147.up_proj", "model.layers.36.mlp.experts.148.up_proj", "model.layers.36.mlp.experts.149.up_proj", "model.layers.36.mlp.experts.150.up_proj", "model.layers.36.mlp.experts.151.up_proj", "model.layers.36.mlp.experts.152.up_proj", "model.layers.36.mlp.experts.153.up_proj", "model.layers.36.mlp.experts.154.up_proj", "model.layers.36.mlp.experts.155.up_proj", "model.layers.36.mlp.experts.156.up_proj", "model.layers.36.mlp.experts.157.up_proj", "model.layers.36.mlp.experts.158.up_proj", "model.layers.36.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.09703890606761e-05, "dbits": 2516582400 }, { "dkld": -6.490945816040039e-05, "dbits": 5033164800 } ] }, { "idx": 218, "layers": [ "model.layers.36.mlp.experts.0.down_proj", "model.layers.36.mlp.experts.1.down_proj", "model.layers.36.mlp.experts.2.down_proj", "model.layers.36.mlp.experts.3.down_proj", "model.layers.36.mlp.experts.4.down_proj", "model.layers.36.mlp.experts.5.down_proj", "model.layers.36.mlp.experts.6.down_proj", "model.layers.36.mlp.experts.7.down_proj", "model.layers.36.mlp.experts.8.down_proj", "model.layers.36.mlp.experts.9.down_proj", "model.layers.36.mlp.experts.10.down_proj", "model.layers.36.mlp.experts.11.down_proj", "model.layers.36.mlp.experts.12.down_proj", "model.layers.36.mlp.experts.13.down_proj", "model.layers.36.mlp.experts.14.down_proj", "model.layers.36.mlp.experts.15.down_proj", "model.layers.36.mlp.experts.16.down_proj", "model.layers.36.mlp.experts.17.down_proj", "model.layers.36.mlp.experts.18.down_proj", "model.layers.36.mlp.experts.19.down_proj", "model.layers.36.mlp.experts.20.down_proj", "model.layers.36.mlp.experts.21.down_proj", "model.layers.36.mlp.experts.22.down_proj", "model.layers.36.mlp.experts.23.down_proj", "model.layers.36.mlp.experts.24.down_proj", "model.layers.36.mlp.experts.25.down_proj", "model.layers.36.mlp.experts.26.down_proj", "model.layers.36.mlp.experts.27.down_proj", "model.layers.36.mlp.experts.28.down_proj", "model.layers.36.mlp.experts.29.down_proj", "model.layers.36.mlp.experts.30.down_proj", "model.layers.36.mlp.experts.31.down_proj", "model.layers.36.mlp.experts.32.down_proj", "model.layers.36.mlp.experts.33.down_proj", "model.layers.36.mlp.experts.34.down_proj", "model.layers.36.mlp.experts.35.down_proj", "model.layers.36.mlp.experts.36.down_proj", "model.layers.36.mlp.experts.37.down_proj", "model.layers.36.mlp.experts.38.down_proj", "model.layers.36.mlp.experts.39.down_proj", "model.layers.36.mlp.experts.40.down_proj", "model.layers.36.mlp.experts.41.down_proj", "model.layers.36.mlp.experts.42.down_proj", "model.layers.36.mlp.experts.43.down_proj", "model.layers.36.mlp.experts.44.down_proj", "model.layers.36.mlp.experts.45.down_proj", "model.layers.36.mlp.experts.46.down_proj", "model.layers.36.mlp.experts.47.down_proj", "model.layers.36.mlp.experts.48.down_proj", "model.layers.36.mlp.experts.49.down_proj", "model.layers.36.mlp.experts.50.down_proj", "model.layers.36.mlp.experts.51.down_proj", "model.layers.36.mlp.experts.52.down_proj", "model.layers.36.mlp.experts.53.down_proj", "model.layers.36.mlp.experts.54.down_proj", "model.layers.36.mlp.experts.55.down_proj", "model.layers.36.mlp.experts.56.down_proj", "model.layers.36.mlp.experts.57.down_proj", "model.layers.36.mlp.experts.58.down_proj", "model.layers.36.mlp.experts.59.down_proj", "model.layers.36.mlp.experts.60.down_proj", "model.layers.36.mlp.experts.61.down_proj", "model.layers.36.mlp.experts.62.down_proj", "model.layers.36.mlp.experts.63.down_proj", "model.layers.36.mlp.experts.64.down_proj", "model.layers.36.mlp.experts.65.down_proj", "model.layers.36.mlp.experts.66.down_proj", "model.layers.36.mlp.experts.67.down_proj", "model.layers.36.mlp.experts.68.down_proj", "model.layers.36.mlp.experts.69.down_proj", "model.layers.36.mlp.experts.70.down_proj", "model.layers.36.mlp.experts.71.down_proj", "model.layers.36.mlp.experts.72.down_proj", "model.layers.36.mlp.experts.73.down_proj", "model.layers.36.mlp.experts.74.down_proj", "model.layers.36.mlp.experts.75.down_proj", "model.layers.36.mlp.experts.76.down_proj", "model.layers.36.mlp.experts.77.down_proj", "model.layers.36.mlp.experts.78.down_proj", "model.layers.36.mlp.experts.79.down_proj", "model.layers.36.mlp.experts.80.down_proj", "model.layers.36.mlp.experts.81.down_proj", "model.layers.36.mlp.experts.82.down_proj", "model.layers.36.mlp.experts.83.down_proj", "model.layers.36.mlp.experts.84.down_proj", "model.layers.36.mlp.experts.85.down_proj", "model.layers.36.mlp.experts.86.down_proj", "model.layers.36.mlp.experts.87.down_proj", "model.layers.36.mlp.experts.88.down_proj", "model.layers.36.mlp.experts.89.down_proj", "model.layers.36.mlp.experts.90.down_proj", "model.layers.36.mlp.experts.91.down_proj", "model.layers.36.mlp.experts.92.down_proj", "model.layers.36.mlp.experts.93.down_proj", "model.layers.36.mlp.experts.94.down_proj", "model.layers.36.mlp.experts.95.down_proj", "model.layers.36.mlp.experts.96.down_proj", "model.layers.36.mlp.experts.97.down_proj", "model.layers.36.mlp.experts.98.down_proj", "model.layers.36.mlp.experts.99.down_proj", "model.layers.36.mlp.experts.100.down_proj", "model.layers.36.mlp.experts.101.down_proj", "model.layers.36.mlp.experts.102.down_proj", "model.layers.36.mlp.experts.103.down_proj", "model.layers.36.mlp.experts.104.down_proj", "model.layers.36.mlp.experts.105.down_proj", "model.layers.36.mlp.experts.106.down_proj", "model.layers.36.mlp.experts.107.down_proj", "model.layers.36.mlp.experts.108.down_proj", "model.layers.36.mlp.experts.109.down_proj", "model.layers.36.mlp.experts.110.down_proj", "model.layers.36.mlp.experts.111.down_proj", "model.layers.36.mlp.experts.112.down_proj", "model.layers.36.mlp.experts.113.down_proj", "model.layers.36.mlp.experts.114.down_proj", "model.layers.36.mlp.experts.115.down_proj", "model.layers.36.mlp.experts.116.down_proj", "model.layers.36.mlp.experts.117.down_proj", "model.layers.36.mlp.experts.118.down_proj", "model.layers.36.mlp.experts.119.down_proj", "model.layers.36.mlp.experts.120.down_proj", "model.layers.36.mlp.experts.121.down_proj", "model.layers.36.mlp.experts.122.down_proj", "model.layers.36.mlp.experts.123.down_proj", "model.layers.36.mlp.experts.124.down_proj", "model.layers.36.mlp.experts.125.down_proj", "model.layers.36.mlp.experts.126.down_proj", "model.layers.36.mlp.experts.127.down_proj", "model.layers.36.mlp.experts.128.down_proj", "model.layers.36.mlp.experts.129.down_proj", "model.layers.36.mlp.experts.130.down_proj", "model.layers.36.mlp.experts.131.down_proj", "model.layers.36.mlp.experts.132.down_proj", "model.layers.36.mlp.experts.133.down_proj", "model.layers.36.mlp.experts.134.down_proj", "model.layers.36.mlp.experts.135.down_proj", "model.layers.36.mlp.experts.136.down_proj", "model.layers.36.mlp.experts.137.down_proj", "model.layers.36.mlp.experts.138.down_proj", "model.layers.36.mlp.experts.139.down_proj", "model.layers.36.mlp.experts.140.down_proj", "model.layers.36.mlp.experts.141.down_proj", "model.layers.36.mlp.experts.142.down_proj", "model.layers.36.mlp.experts.143.down_proj", "model.layers.36.mlp.experts.144.down_proj", "model.layers.36.mlp.experts.145.down_proj", "model.layers.36.mlp.experts.146.down_proj", "model.layers.36.mlp.experts.147.down_proj", "model.layers.36.mlp.experts.148.down_proj", "model.layers.36.mlp.experts.149.down_proj", "model.layers.36.mlp.experts.150.down_proj", "model.layers.36.mlp.experts.151.down_proj", "model.layers.36.mlp.experts.152.down_proj", "model.layers.36.mlp.experts.153.down_proj", "model.layers.36.mlp.experts.154.down_proj", "model.layers.36.mlp.experts.155.down_proj", "model.layers.36.mlp.experts.156.down_proj", "model.layers.36.mlp.experts.157.down_proj", "model.layers.36.mlp.experts.158.down_proj", "model.layers.36.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.566223990172148e-05, "dbits": 1258291200 }, { "dkld": -6.74748094752417e-05, "dbits": 2516582400 } ] }, { "idx": 219, "layers": [ "model.layers.37.self_attn.q_proj" ], "candidates": [ { "dkld": 6.436654366552899e-05, "dbits": 62914560 }, { "dkld": 5.0728744827211944e-05, "dbits": 125829120 } ] }, { "idx": 220, "layers": [ "model.layers.37.self_attn.k_proj", "model.layers.37.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00015153482090681653, "dbits": 10485760 }, { "dkld": -4.267545882612363e-05, "dbits": 20971520 } ] }, { "idx": 221, "layers": [ "model.layers.37.self_attn.o_proj" ], "candidates": [ { "dkld": 5.9670978225769e-05, "dbits": 62914560 }, { "dkld": 6.110297981649741e-05, "dbits": 125829120 } ] }, { "idx": 222, "layers": [ "model.layers.37.mlp.shared_experts.gate_proj", "model.layers.37.mlp.shared_experts.up_proj", "model.layers.37.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.9126804545521736e-05, "dbits": 23592960 }, { "dkld": -7.800809107720748e-05, "dbits": 47185920 } ] }, { "idx": 223, "layers": [ "model.layers.37.mlp.experts.0.gate_proj", "model.layers.37.mlp.experts.1.gate_proj", "model.layers.37.mlp.experts.2.gate_proj", "model.layers.37.mlp.experts.3.gate_proj", "model.layers.37.mlp.experts.4.gate_proj", "model.layers.37.mlp.experts.5.gate_proj", "model.layers.37.mlp.experts.6.gate_proj", "model.layers.37.mlp.experts.7.gate_proj", "model.layers.37.mlp.experts.8.gate_proj", "model.layers.37.mlp.experts.9.gate_proj", "model.layers.37.mlp.experts.10.gate_proj", "model.layers.37.mlp.experts.11.gate_proj", "model.layers.37.mlp.experts.12.gate_proj", "model.layers.37.mlp.experts.13.gate_proj", "model.layers.37.mlp.experts.14.gate_proj", "model.layers.37.mlp.experts.15.gate_proj", "model.layers.37.mlp.experts.16.gate_proj", "model.layers.37.mlp.experts.17.gate_proj", "model.layers.37.mlp.experts.18.gate_proj", "model.layers.37.mlp.experts.19.gate_proj", "model.layers.37.mlp.experts.20.gate_proj", "model.layers.37.mlp.experts.21.gate_proj", "model.layers.37.mlp.experts.22.gate_proj", "model.layers.37.mlp.experts.23.gate_proj", "model.layers.37.mlp.experts.24.gate_proj", "model.layers.37.mlp.experts.25.gate_proj", "model.layers.37.mlp.experts.26.gate_proj", "model.layers.37.mlp.experts.27.gate_proj", "model.layers.37.mlp.experts.28.gate_proj", "model.layers.37.mlp.experts.29.gate_proj", "model.layers.37.mlp.experts.30.gate_proj", "model.layers.37.mlp.experts.31.gate_proj", "model.layers.37.mlp.experts.32.gate_proj", "model.layers.37.mlp.experts.33.gate_proj", "model.layers.37.mlp.experts.34.gate_proj", "model.layers.37.mlp.experts.35.gate_proj", "model.layers.37.mlp.experts.36.gate_proj", "model.layers.37.mlp.experts.37.gate_proj", "model.layers.37.mlp.experts.38.gate_proj", "model.layers.37.mlp.experts.39.gate_proj", "model.layers.37.mlp.experts.40.gate_proj", "model.layers.37.mlp.experts.41.gate_proj", "model.layers.37.mlp.experts.42.gate_proj", "model.layers.37.mlp.experts.43.gate_proj", "model.layers.37.mlp.experts.44.gate_proj", "model.layers.37.mlp.experts.45.gate_proj", "model.layers.37.mlp.experts.46.gate_proj", "model.layers.37.mlp.experts.47.gate_proj", "model.layers.37.mlp.experts.48.gate_proj", "model.layers.37.mlp.experts.49.gate_proj", "model.layers.37.mlp.experts.50.gate_proj", "model.layers.37.mlp.experts.51.gate_proj", "model.layers.37.mlp.experts.52.gate_proj", "model.layers.37.mlp.experts.53.gate_proj", "model.layers.37.mlp.experts.54.gate_proj", "model.layers.37.mlp.experts.55.gate_proj", "model.layers.37.mlp.experts.56.gate_proj", "model.layers.37.mlp.experts.57.gate_proj", "model.layers.37.mlp.experts.58.gate_proj", "model.layers.37.mlp.experts.59.gate_proj", "model.layers.37.mlp.experts.60.gate_proj", "model.layers.37.mlp.experts.61.gate_proj", "model.layers.37.mlp.experts.62.gate_proj", "model.layers.37.mlp.experts.63.gate_proj", "model.layers.37.mlp.experts.64.gate_proj", "model.layers.37.mlp.experts.65.gate_proj", "model.layers.37.mlp.experts.66.gate_proj", "model.layers.37.mlp.experts.67.gate_proj", "model.layers.37.mlp.experts.68.gate_proj", "model.layers.37.mlp.experts.69.gate_proj", "model.layers.37.mlp.experts.70.gate_proj", "model.layers.37.mlp.experts.71.gate_proj", "model.layers.37.mlp.experts.72.gate_proj", "model.layers.37.mlp.experts.73.gate_proj", "model.layers.37.mlp.experts.74.gate_proj", "model.layers.37.mlp.experts.75.gate_proj", "model.layers.37.mlp.experts.76.gate_proj", "model.layers.37.mlp.experts.77.gate_proj", "model.layers.37.mlp.experts.78.gate_proj", "model.layers.37.mlp.experts.79.gate_proj", "model.layers.37.mlp.experts.80.gate_proj", "model.layers.37.mlp.experts.81.gate_proj", "model.layers.37.mlp.experts.82.gate_proj", "model.layers.37.mlp.experts.83.gate_proj", "model.layers.37.mlp.experts.84.gate_proj", "model.layers.37.mlp.experts.85.gate_proj", "model.layers.37.mlp.experts.86.gate_proj", "model.layers.37.mlp.experts.87.gate_proj", "model.layers.37.mlp.experts.88.gate_proj", "model.layers.37.mlp.experts.89.gate_proj", "model.layers.37.mlp.experts.90.gate_proj", "model.layers.37.mlp.experts.91.gate_proj", "model.layers.37.mlp.experts.92.gate_proj", "model.layers.37.mlp.experts.93.gate_proj", "model.layers.37.mlp.experts.94.gate_proj", "model.layers.37.mlp.experts.95.gate_proj", "model.layers.37.mlp.experts.96.gate_proj", "model.layers.37.mlp.experts.97.gate_proj", "model.layers.37.mlp.experts.98.gate_proj", "model.layers.37.mlp.experts.99.gate_proj", "model.layers.37.mlp.experts.100.gate_proj", "model.layers.37.mlp.experts.101.gate_proj", "model.layers.37.mlp.experts.102.gate_proj", "model.layers.37.mlp.experts.103.gate_proj", "model.layers.37.mlp.experts.104.gate_proj", "model.layers.37.mlp.experts.105.gate_proj", "model.layers.37.mlp.experts.106.gate_proj", "model.layers.37.mlp.experts.107.gate_proj", "model.layers.37.mlp.experts.108.gate_proj", "model.layers.37.mlp.experts.109.gate_proj", "model.layers.37.mlp.experts.110.gate_proj", "model.layers.37.mlp.experts.111.gate_proj", "model.layers.37.mlp.experts.112.gate_proj", "model.layers.37.mlp.experts.113.gate_proj", "model.layers.37.mlp.experts.114.gate_proj", "model.layers.37.mlp.experts.115.gate_proj", "model.layers.37.mlp.experts.116.gate_proj", "model.layers.37.mlp.experts.117.gate_proj", "model.layers.37.mlp.experts.118.gate_proj", "model.layers.37.mlp.experts.119.gate_proj", "model.layers.37.mlp.experts.120.gate_proj", "model.layers.37.mlp.experts.121.gate_proj", "model.layers.37.mlp.experts.122.gate_proj", "model.layers.37.mlp.experts.123.gate_proj", "model.layers.37.mlp.experts.124.gate_proj", "model.layers.37.mlp.experts.125.gate_proj", "model.layers.37.mlp.experts.126.gate_proj", "model.layers.37.mlp.experts.127.gate_proj", "model.layers.37.mlp.experts.128.gate_proj", "model.layers.37.mlp.experts.129.gate_proj", "model.layers.37.mlp.experts.130.gate_proj", "model.layers.37.mlp.experts.131.gate_proj", "model.layers.37.mlp.experts.132.gate_proj", "model.layers.37.mlp.experts.133.gate_proj", "model.layers.37.mlp.experts.134.gate_proj", "model.layers.37.mlp.experts.135.gate_proj", "model.layers.37.mlp.experts.136.gate_proj", "model.layers.37.mlp.experts.137.gate_proj", "model.layers.37.mlp.experts.138.gate_proj", "model.layers.37.mlp.experts.139.gate_proj", "model.layers.37.mlp.experts.140.gate_proj", "model.layers.37.mlp.experts.141.gate_proj", "model.layers.37.mlp.experts.142.gate_proj", "model.layers.37.mlp.experts.143.gate_proj", "model.layers.37.mlp.experts.144.gate_proj", "model.layers.37.mlp.experts.145.gate_proj", "model.layers.37.mlp.experts.146.gate_proj", "model.layers.37.mlp.experts.147.gate_proj", "model.layers.37.mlp.experts.148.gate_proj", "model.layers.37.mlp.experts.149.gate_proj", "model.layers.37.mlp.experts.150.gate_proj", "model.layers.37.mlp.experts.151.gate_proj", "model.layers.37.mlp.experts.152.gate_proj", "model.layers.37.mlp.experts.153.gate_proj", "model.layers.37.mlp.experts.154.gate_proj", "model.layers.37.mlp.experts.155.gate_proj", "model.layers.37.mlp.experts.156.gate_proj", "model.layers.37.mlp.experts.157.gate_proj", "model.layers.37.mlp.experts.158.gate_proj", "model.layers.37.mlp.experts.159.gate_proj", "model.layers.37.mlp.experts.0.up_proj", "model.layers.37.mlp.experts.1.up_proj", "model.layers.37.mlp.experts.2.up_proj", "model.layers.37.mlp.experts.3.up_proj", "model.layers.37.mlp.experts.4.up_proj", "model.layers.37.mlp.experts.5.up_proj", "model.layers.37.mlp.experts.6.up_proj", "model.layers.37.mlp.experts.7.up_proj", "model.layers.37.mlp.experts.8.up_proj", "model.layers.37.mlp.experts.9.up_proj", "model.layers.37.mlp.experts.10.up_proj", "model.layers.37.mlp.experts.11.up_proj", "model.layers.37.mlp.experts.12.up_proj", "model.layers.37.mlp.experts.13.up_proj", "model.layers.37.mlp.experts.14.up_proj", "model.layers.37.mlp.experts.15.up_proj", "model.layers.37.mlp.experts.16.up_proj", "model.layers.37.mlp.experts.17.up_proj", "model.layers.37.mlp.experts.18.up_proj", "model.layers.37.mlp.experts.19.up_proj", "model.layers.37.mlp.experts.20.up_proj", "model.layers.37.mlp.experts.21.up_proj", "model.layers.37.mlp.experts.22.up_proj", "model.layers.37.mlp.experts.23.up_proj", "model.layers.37.mlp.experts.24.up_proj", "model.layers.37.mlp.experts.25.up_proj", "model.layers.37.mlp.experts.26.up_proj", "model.layers.37.mlp.experts.27.up_proj", "model.layers.37.mlp.experts.28.up_proj", "model.layers.37.mlp.experts.29.up_proj", "model.layers.37.mlp.experts.30.up_proj", "model.layers.37.mlp.experts.31.up_proj", "model.layers.37.mlp.experts.32.up_proj", "model.layers.37.mlp.experts.33.up_proj", "model.layers.37.mlp.experts.34.up_proj", "model.layers.37.mlp.experts.35.up_proj", "model.layers.37.mlp.experts.36.up_proj", "model.layers.37.mlp.experts.37.up_proj", "model.layers.37.mlp.experts.38.up_proj", "model.layers.37.mlp.experts.39.up_proj", "model.layers.37.mlp.experts.40.up_proj", "model.layers.37.mlp.experts.41.up_proj", "model.layers.37.mlp.experts.42.up_proj", "model.layers.37.mlp.experts.43.up_proj", "model.layers.37.mlp.experts.44.up_proj", "model.layers.37.mlp.experts.45.up_proj", "model.layers.37.mlp.experts.46.up_proj", "model.layers.37.mlp.experts.47.up_proj", "model.layers.37.mlp.experts.48.up_proj", "model.layers.37.mlp.experts.49.up_proj", "model.layers.37.mlp.experts.50.up_proj", "model.layers.37.mlp.experts.51.up_proj", "model.layers.37.mlp.experts.52.up_proj", "model.layers.37.mlp.experts.53.up_proj", "model.layers.37.mlp.experts.54.up_proj", "model.layers.37.mlp.experts.55.up_proj", "model.layers.37.mlp.experts.56.up_proj", "model.layers.37.mlp.experts.57.up_proj", "model.layers.37.mlp.experts.58.up_proj", "model.layers.37.mlp.experts.59.up_proj", "model.layers.37.mlp.experts.60.up_proj", "model.layers.37.mlp.experts.61.up_proj", "model.layers.37.mlp.experts.62.up_proj", "model.layers.37.mlp.experts.63.up_proj", "model.layers.37.mlp.experts.64.up_proj", "model.layers.37.mlp.experts.65.up_proj", "model.layers.37.mlp.experts.66.up_proj", "model.layers.37.mlp.experts.67.up_proj", "model.layers.37.mlp.experts.68.up_proj", "model.layers.37.mlp.experts.69.up_proj", "model.layers.37.mlp.experts.70.up_proj", "model.layers.37.mlp.experts.71.up_proj", "model.layers.37.mlp.experts.72.up_proj", "model.layers.37.mlp.experts.73.up_proj", "model.layers.37.mlp.experts.74.up_proj", "model.layers.37.mlp.experts.75.up_proj", "model.layers.37.mlp.experts.76.up_proj", "model.layers.37.mlp.experts.77.up_proj", "model.layers.37.mlp.experts.78.up_proj", "model.layers.37.mlp.experts.79.up_proj", "model.layers.37.mlp.experts.80.up_proj", "model.layers.37.mlp.experts.81.up_proj", "model.layers.37.mlp.experts.82.up_proj", "model.layers.37.mlp.experts.83.up_proj", "model.layers.37.mlp.experts.84.up_proj", "model.layers.37.mlp.experts.85.up_proj", "model.layers.37.mlp.experts.86.up_proj", "model.layers.37.mlp.experts.87.up_proj", "model.layers.37.mlp.experts.88.up_proj", "model.layers.37.mlp.experts.89.up_proj", "model.layers.37.mlp.experts.90.up_proj", "model.layers.37.mlp.experts.91.up_proj", "model.layers.37.mlp.experts.92.up_proj", "model.layers.37.mlp.experts.93.up_proj", "model.layers.37.mlp.experts.94.up_proj", "model.layers.37.mlp.experts.95.up_proj", "model.layers.37.mlp.experts.96.up_proj", "model.layers.37.mlp.experts.97.up_proj", "model.layers.37.mlp.experts.98.up_proj", "model.layers.37.mlp.experts.99.up_proj", "model.layers.37.mlp.experts.100.up_proj", "model.layers.37.mlp.experts.101.up_proj", "model.layers.37.mlp.experts.102.up_proj", "model.layers.37.mlp.experts.103.up_proj", "model.layers.37.mlp.experts.104.up_proj", "model.layers.37.mlp.experts.105.up_proj", "model.layers.37.mlp.experts.106.up_proj", "model.layers.37.mlp.experts.107.up_proj", "model.layers.37.mlp.experts.108.up_proj", "model.layers.37.mlp.experts.109.up_proj", "model.layers.37.mlp.experts.110.up_proj", "model.layers.37.mlp.experts.111.up_proj", "model.layers.37.mlp.experts.112.up_proj", "model.layers.37.mlp.experts.113.up_proj", "model.layers.37.mlp.experts.114.up_proj", "model.layers.37.mlp.experts.115.up_proj", "model.layers.37.mlp.experts.116.up_proj", "model.layers.37.mlp.experts.117.up_proj", "model.layers.37.mlp.experts.118.up_proj", "model.layers.37.mlp.experts.119.up_proj", "model.layers.37.mlp.experts.120.up_proj", "model.layers.37.mlp.experts.121.up_proj", "model.layers.37.mlp.experts.122.up_proj", "model.layers.37.mlp.experts.123.up_proj", "model.layers.37.mlp.experts.124.up_proj", "model.layers.37.mlp.experts.125.up_proj", "model.layers.37.mlp.experts.126.up_proj", "model.layers.37.mlp.experts.127.up_proj", "model.layers.37.mlp.experts.128.up_proj", "model.layers.37.mlp.experts.129.up_proj", "model.layers.37.mlp.experts.130.up_proj", "model.layers.37.mlp.experts.131.up_proj", "model.layers.37.mlp.experts.132.up_proj", "model.layers.37.mlp.experts.133.up_proj", "model.layers.37.mlp.experts.134.up_proj", "model.layers.37.mlp.experts.135.up_proj", "model.layers.37.mlp.experts.136.up_proj", "model.layers.37.mlp.experts.137.up_proj", "model.layers.37.mlp.experts.138.up_proj", "model.layers.37.mlp.experts.139.up_proj", "model.layers.37.mlp.experts.140.up_proj", "model.layers.37.mlp.experts.141.up_proj", "model.layers.37.mlp.experts.142.up_proj", "model.layers.37.mlp.experts.143.up_proj", "model.layers.37.mlp.experts.144.up_proj", "model.layers.37.mlp.experts.145.up_proj", "model.layers.37.mlp.experts.146.up_proj", "model.layers.37.mlp.experts.147.up_proj", "model.layers.37.mlp.experts.148.up_proj", "model.layers.37.mlp.experts.149.up_proj", "model.layers.37.mlp.experts.150.up_proj", "model.layers.37.mlp.experts.151.up_proj", "model.layers.37.mlp.experts.152.up_proj", "model.layers.37.mlp.experts.153.up_proj", "model.layers.37.mlp.experts.154.up_proj", "model.layers.37.mlp.experts.155.up_proj", "model.layers.37.mlp.experts.156.up_proj", "model.layers.37.mlp.experts.157.up_proj", "model.layers.37.mlp.experts.158.up_proj", "model.layers.37.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.1012051254510533e-05, "dbits": 2516582400 }, { "dkld": -2.2852839902042302e-05, "dbits": 5033164800 } ] }, { "idx": 224, "layers": [ "model.layers.37.mlp.experts.0.down_proj", "model.layers.37.mlp.experts.1.down_proj", "model.layers.37.mlp.experts.2.down_proj", "model.layers.37.mlp.experts.3.down_proj", "model.layers.37.mlp.experts.4.down_proj", "model.layers.37.mlp.experts.5.down_proj", "model.layers.37.mlp.experts.6.down_proj", "model.layers.37.mlp.experts.7.down_proj", "model.layers.37.mlp.experts.8.down_proj", "model.layers.37.mlp.experts.9.down_proj", "model.layers.37.mlp.experts.10.down_proj", "model.layers.37.mlp.experts.11.down_proj", "model.layers.37.mlp.experts.12.down_proj", "model.layers.37.mlp.experts.13.down_proj", "model.layers.37.mlp.experts.14.down_proj", "model.layers.37.mlp.experts.15.down_proj", "model.layers.37.mlp.experts.16.down_proj", "model.layers.37.mlp.experts.17.down_proj", "model.layers.37.mlp.experts.18.down_proj", "model.layers.37.mlp.experts.19.down_proj", "model.layers.37.mlp.experts.20.down_proj", "model.layers.37.mlp.experts.21.down_proj", "model.layers.37.mlp.experts.22.down_proj", "model.layers.37.mlp.experts.23.down_proj", "model.layers.37.mlp.experts.24.down_proj", "model.layers.37.mlp.experts.25.down_proj", "model.layers.37.mlp.experts.26.down_proj", "model.layers.37.mlp.experts.27.down_proj", "model.layers.37.mlp.experts.28.down_proj", "model.layers.37.mlp.experts.29.down_proj", "model.layers.37.mlp.experts.30.down_proj", "model.layers.37.mlp.experts.31.down_proj", "model.layers.37.mlp.experts.32.down_proj", "model.layers.37.mlp.experts.33.down_proj", "model.layers.37.mlp.experts.34.down_proj", "model.layers.37.mlp.experts.35.down_proj", "model.layers.37.mlp.experts.36.down_proj", "model.layers.37.mlp.experts.37.down_proj", "model.layers.37.mlp.experts.38.down_proj", "model.layers.37.mlp.experts.39.down_proj", "model.layers.37.mlp.experts.40.down_proj", "model.layers.37.mlp.experts.41.down_proj", "model.layers.37.mlp.experts.42.down_proj", "model.layers.37.mlp.experts.43.down_proj", "model.layers.37.mlp.experts.44.down_proj", "model.layers.37.mlp.experts.45.down_proj", "model.layers.37.mlp.experts.46.down_proj", "model.layers.37.mlp.experts.47.down_proj", "model.layers.37.mlp.experts.48.down_proj", "model.layers.37.mlp.experts.49.down_proj", "model.layers.37.mlp.experts.50.down_proj", "model.layers.37.mlp.experts.51.down_proj", "model.layers.37.mlp.experts.52.down_proj", "model.layers.37.mlp.experts.53.down_proj", "model.layers.37.mlp.experts.54.down_proj", "model.layers.37.mlp.experts.55.down_proj", "model.layers.37.mlp.experts.56.down_proj", "model.layers.37.mlp.experts.57.down_proj", "model.layers.37.mlp.experts.58.down_proj", "model.layers.37.mlp.experts.59.down_proj", "model.layers.37.mlp.experts.60.down_proj", "model.layers.37.mlp.experts.61.down_proj", "model.layers.37.mlp.experts.62.down_proj", "model.layers.37.mlp.experts.63.down_proj", "model.layers.37.mlp.experts.64.down_proj", "model.layers.37.mlp.experts.65.down_proj", "model.layers.37.mlp.experts.66.down_proj", "model.layers.37.mlp.experts.67.down_proj", "model.layers.37.mlp.experts.68.down_proj", "model.layers.37.mlp.experts.69.down_proj", "model.layers.37.mlp.experts.70.down_proj", "model.layers.37.mlp.experts.71.down_proj", "model.layers.37.mlp.experts.72.down_proj", "model.layers.37.mlp.experts.73.down_proj", "model.layers.37.mlp.experts.74.down_proj", "model.layers.37.mlp.experts.75.down_proj", "model.layers.37.mlp.experts.76.down_proj", "model.layers.37.mlp.experts.77.down_proj", "model.layers.37.mlp.experts.78.down_proj", "model.layers.37.mlp.experts.79.down_proj", "model.layers.37.mlp.experts.80.down_proj", "model.layers.37.mlp.experts.81.down_proj", "model.layers.37.mlp.experts.82.down_proj", "model.layers.37.mlp.experts.83.down_proj", "model.layers.37.mlp.experts.84.down_proj", "model.layers.37.mlp.experts.85.down_proj", "model.layers.37.mlp.experts.86.down_proj", "model.layers.37.mlp.experts.87.down_proj", "model.layers.37.mlp.experts.88.down_proj", "model.layers.37.mlp.experts.89.down_proj", "model.layers.37.mlp.experts.90.down_proj", "model.layers.37.mlp.experts.91.down_proj", "model.layers.37.mlp.experts.92.down_proj", "model.layers.37.mlp.experts.93.down_proj", "model.layers.37.mlp.experts.94.down_proj", "model.layers.37.mlp.experts.95.down_proj", "model.layers.37.mlp.experts.96.down_proj", "model.layers.37.mlp.experts.97.down_proj", "model.layers.37.mlp.experts.98.down_proj", "model.layers.37.mlp.experts.99.down_proj", "model.layers.37.mlp.experts.100.down_proj", "model.layers.37.mlp.experts.101.down_proj", "model.layers.37.mlp.experts.102.down_proj", "model.layers.37.mlp.experts.103.down_proj", "model.layers.37.mlp.experts.104.down_proj", "model.layers.37.mlp.experts.105.down_proj", "model.layers.37.mlp.experts.106.down_proj", "model.layers.37.mlp.experts.107.down_proj", "model.layers.37.mlp.experts.108.down_proj", "model.layers.37.mlp.experts.109.down_proj", "model.layers.37.mlp.experts.110.down_proj", "model.layers.37.mlp.experts.111.down_proj", "model.layers.37.mlp.experts.112.down_proj", "model.layers.37.mlp.experts.113.down_proj", "model.layers.37.mlp.experts.114.down_proj", "model.layers.37.mlp.experts.115.down_proj", "model.layers.37.mlp.experts.116.down_proj", "model.layers.37.mlp.experts.117.down_proj", "model.layers.37.mlp.experts.118.down_proj", "model.layers.37.mlp.experts.119.down_proj", "model.layers.37.mlp.experts.120.down_proj", "model.layers.37.mlp.experts.121.down_proj", "model.layers.37.mlp.experts.122.down_proj", "model.layers.37.mlp.experts.123.down_proj", "model.layers.37.mlp.experts.124.down_proj", "model.layers.37.mlp.experts.125.down_proj", "model.layers.37.mlp.experts.126.down_proj", "model.layers.37.mlp.experts.127.down_proj", "model.layers.37.mlp.experts.128.down_proj", "model.layers.37.mlp.experts.129.down_proj", "model.layers.37.mlp.experts.130.down_proj", "model.layers.37.mlp.experts.131.down_proj", "model.layers.37.mlp.experts.132.down_proj", "model.layers.37.mlp.experts.133.down_proj", "model.layers.37.mlp.experts.134.down_proj", "model.layers.37.mlp.experts.135.down_proj", "model.layers.37.mlp.experts.136.down_proj", "model.layers.37.mlp.experts.137.down_proj", "model.layers.37.mlp.experts.138.down_proj", "model.layers.37.mlp.experts.139.down_proj", "model.layers.37.mlp.experts.140.down_proj", "model.layers.37.mlp.experts.141.down_proj", "model.layers.37.mlp.experts.142.down_proj", "model.layers.37.mlp.experts.143.down_proj", "model.layers.37.mlp.experts.144.down_proj", "model.layers.37.mlp.experts.145.down_proj", "model.layers.37.mlp.experts.146.down_proj", "model.layers.37.mlp.experts.147.down_proj", "model.layers.37.mlp.experts.148.down_proj", "model.layers.37.mlp.experts.149.down_proj", "model.layers.37.mlp.experts.150.down_proj", "model.layers.37.mlp.experts.151.down_proj", "model.layers.37.mlp.experts.152.down_proj", "model.layers.37.mlp.experts.153.down_proj", "model.layers.37.mlp.experts.154.down_proj", "model.layers.37.mlp.experts.155.down_proj", "model.layers.37.mlp.experts.156.down_proj", "model.layers.37.mlp.experts.157.down_proj", "model.layers.37.mlp.experts.158.down_proj", "model.layers.37.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -7.670186460017117e-06, "dbits": 1258291200 }, { "dkld": 4.768185317517021e-06, "dbits": 2516582400 } ] }, { "idx": 225, "layers": [ "model.layers.38.self_attn.q_proj" ], "candidates": [ { "dkld": -0.00011301408521830966, "dbits": 62914560 }, { "dkld": -0.0001055832719430317, "dbits": 125829120 } ] }, { "idx": 226, "layers": [ "model.layers.38.self_attn.k_proj", "model.layers.38.self_attn.v_proj" ], "candidates": [ { "dkld": 1.0586436837912994e-05, "dbits": 10485760 }, { "dkld": 1.1087581515313236e-05, "dbits": 20971520 } ] }, { "idx": 227, "layers": [ "model.layers.38.self_attn.o_proj" ], "candidates": [ { "dkld": -8.970058988779644e-05, "dbits": 62914560 }, { "dkld": -0.0001486945897340771, "dbits": 125829120 } ] }, { "idx": 228, "layers": [ "model.layers.38.mlp.shared_experts.gate_proj", "model.layers.38.mlp.shared_experts.up_proj", "model.layers.38.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.25256197154515e-05, "dbits": 23592960 }, { "dkld": 4.4975359924138286e-05, "dbits": 47185920 } ] }, { "idx": 229, "layers": [ "model.layers.38.mlp.experts.0.gate_proj", "model.layers.38.mlp.experts.1.gate_proj", "model.layers.38.mlp.experts.2.gate_proj", "model.layers.38.mlp.experts.3.gate_proj", "model.layers.38.mlp.experts.4.gate_proj", "model.layers.38.mlp.experts.5.gate_proj", "model.layers.38.mlp.experts.6.gate_proj", "model.layers.38.mlp.experts.7.gate_proj", "model.layers.38.mlp.experts.8.gate_proj", "model.layers.38.mlp.experts.9.gate_proj", "model.layers.38.mlp.experts.10.gate_proj", "model.layers.38.mlp.experts.11.gate_proj", "model.layers.38.mlp.experts.12.gate_proj", "model.layers.38.mlp.experts.13.gate_proj", "model.layers.38.mlp.experts.14.gate_proj", "model.layers.38.mlp.experts.15.gate_proj", "model.layers.38.mlp.experts.16.gate_proj", "model.layers.38.mlp.experts.17.gate_proj", "model.layers.38.mlp.experts.18.gate_proj", "model.layers.38.mlp.experts.19.gate_proj", "model.layers.38.mlp.experts.20.gate_proj", "model.layers.38.mlp.experts.21.gate_proj", "model.layers.38.mlp.experts.22.gate_proj", "model.layers.38.mlp.experts.23.gate_proj", "model.layers.38.mlp.experts.24.gate_proj", "model.layers.38.mlp.experts.25.gate_proj", "model.layers.38.mlp.experts.26.gate_proj", "model.layers.38.mlp.experts.27.gate_proj", "model.layers.38.mlp.experts.28.gate_proj", "model.layers.38.mlp.experts.29.gate_proj", "model.layers.38.mlp.experts.30.gate_proj", "model.layers.38.mlp.experts.31.gate_proj", "model.layers.38.mlp.experts.32.gate_proj", "model.layers.38.mlp.experts.33.gate_proj", "model.layers.38.mlp.experts.34.gate_proj", "model.layers.38.mlp.experts.35.gate_proj", "model.layers.38.mlp.experts.36.gate_proj", "model.layers.38.mlp.experts.37.gate_proj", "model.layers.38.mlp.experts.38.gate_proj", "model.layers.38.mlp.experts.39.gate_proj", "model.layers.38.mlp.experts.40.gate_proj", "model.layers.38.mlp.experts.41.gate_proj", "model.layers.38.mlp.experts.42.gate_proj", "model.layers.38.mlp.experts.43.gate_proj", "model.layers.38.mlp.experts.44.gate_proj", "model.layers.38.mlp.experts.45.gate_proj", "model.layers.38.mlp.experts.46.gate_proj", "model.layers.38.mlp.experts.47.gate_proj", "model.layers.38.mlp.experts.48.gate_proj", "model.layers.38.mlp.experts.49.gate_proj", "model.layers.38.mlp.experts.50.gate_proj", "model.layers.38.mlp.experts.51.gate_proj", "model.layers.38.mlp.experts.52.gate_proj", "model.layers.38.mlp.experts.53.gate_proj", "model.layers.38.mlp.experts.54.gate_proj", "model.layers.38.mlp.experts.55.gate_proj", "model.layers.38.mlp.experts.56.gate_proj", "model.layers.38.mlp.experts.57.gate_proj", "model.layers.38.mlp.experts.58.gate_proj", "model.layers.38.mlp.experts.59.gate_proj", "model.layers.38.mlp.experts.60.gate_proj", "model.layers.38.mlp.experts.61.gate_proj", "model.layers.38.mlp.experts.62.gate_proj", "model.layers.38.mlp.experts.63.gate_proj", "model.layers.38.mlp.experts.64.gate_proj", "model.layers.38.mlp.experts.65.gate_proj", "model.layers.38.mlp.experts.66.gate_proj", "model.layers.38.mlp.experts.67.gate_proj", "model.layers.38.mlp.experts.68.gate_proj", "model.layers.38.mlp.experts.69.gate_proj", "model.layers.38.mlp.experts.70.gate_proj", "model.layers.38.mlp.experts.71.gate_proj", "model.layers.38.mlp.experts.72.gate_proj", "model.layers.38.mlp.experts.73.gate_proj", "model.layers.38.mlp.experts.74.gate_proj", "model.layers.38.mlp.experts.75.gate_proj", "model.layers.38.mlp.experts.76.gate_proj", "model.layers.38.mlp.experts.77.gate_proj", "model.layers.38.mlp.experts.78.gate_proj", "model.layers.38.mlp.experts.79.gate_proj", "model.layers.38.mlp.experts.80.gate_proj", "model.layers.38.mlp.experts.81.gate_proj", "model.layers.38.mlp.experts.82.gate_proj", "model.layers.38.mlp.experts.83.gate_proj", "model.layers.38.mlp.experts.84.gate_proj", "model.layers.38.mlp.experts.85.gate_proj", "model.layers.38.mlp.experts.86.gate_proj", "model.layers.38.mlp.experts.87.gate_proj", "model.layers.38.mlp.experts.88.gate_proj", "model.layers.38.mlp.experts.89.gate_proj", "model.layers.38.mlp.experts.90.gate_proj", "model.layers.38.mlp.experts.91.gate_proj", "model.layers.38.mlp.experts.92.gate_proj", "model.layers.38.mlp.experts.93.gate_proj", "model.layers.38.mlp.experts.94.gate_proj", "model.layers.38.mlp.experts.95.gate_proj", "model.layers.38.mlp.experts.96.gate_proj", "model.layers.38.mlp.experts.97.gate_proj", "model.layers.38.mlp.experts.98.gate_proj", "model.layers.38.mlp.experts.99.gate_proj", "model.layers.38.mlp.experts.100.gate_proj", "model.layers.38.mlp.experts.101.gate_proj", "model.layers.38.mlp.experts.102.gate_proj", "model.layers.38.mlp.experts.103.gate_proj", "model.layers.38.mlp.experts.104.gate_proj", "model.layers.38.mlp.experts.105.gate_proj", "model.layers.38.mlp.experts.106.gate_proj", "model.layers.38.mlp.experts.107.gate_proj", "model.layers.38.mlp.experts.108.gate_proj", "model.layers.38.mlp.experts.109.gate_proj", "model.layers.38.mlp.experts.110.gate_proj", "model.layers.38.mlp.experts.111.gate_proj", "model.layers.38.mlp.experts.112.gate_proj", "model.layers.38.mlp.experts.113.gate_proj", "model.layers.38.mlp.experts.114.gate_proj", "model.layers.38.mlp.experts.115.gate_proj", "model.layers.38.mlp.experts.116.gate_proj", "model.layers.38.mlp.experts.117.gate_proj", "model.layers.38.mlp.experts.118.gate_proj", "model.layers.38.mlp.experts.119.gate_proj", "model.layers.38.mlp.experts.120.gate_proj", "model.layers.38.mlp.experts.121.gate_proj", "model.layers.38.mlp.experts.122.gate_proj", "model.layers.38.mlp.experts.123.gate_proj", "model.layers.38.mlp.experts.124.gate_proj", "model.layers.38.mlp.experts.125.gate_proj", "model.layers.38.mlp.experts.126.gate_proj", "model.layers.38.mlp.experts.127.gate_proj", "model.layers.38.mlp.experts.128.gate_proj", "model.layers.38.mlp.experts.129.gate_proj", "model.layers.38.mlp.experts.130.gate_proj", "model.layers.38.mlp.experts.131.gate_proj", "model.layers.38.mlp.experts.132.gate_proj", "model.layers.38.mlp.experts.133.gate_proj", "model.layers.38.mlp.experts.134.gate_proj", "model.layers.38.mlp.experts.135.gate_proj", "model.layers.38.mlp.experts.136.gate_proj", "model.layers.38.mlp.experts.137.gate_proj", "model.layers.38.mlp.experts.138.gate_proj", "model.layers.38.mlp.experts.139.gate_proj", "model.layers.38.mlp.experts.140.gate_proj", "model.layers.38.mlp.experts.141.gate_proj", "model.layers.38.mlp.experts.142.gate_proj", "model.layers.38.mlp.experts.143.gate_proj", "model.layers.38.mlp.experts.144.gate_proj", "model.layers.38.mlp.experts.145.gate_proj", "model.layers.38.mlp.experts.146.gate_proj", "model.layers.38.mlp.experts.147.gate_proj", "model.layers.38.mlp.experts.148.gate_proj", "model.layers.38.mlp.experts.149.gate_proj", "model.layers.38.mlp.experts.150.gate_proj", "model.layers.38.mlp.experts.151.gate_proj", "model.layers.38.mlp.experts.152.gate_proj", "model.layers.38.mlp.experts.153.gate_proj", "model.layers.38.mlp.experts.154.gate_proj", "model.layers.38.mlp.experts.155.gate_proj", "model.layers.38.mlp.experts.156.gate_proj", "model.layers.38.mlp.experts.157.gate_proj", "model.layers.38.mlp.experts.158.gate_proj", "model.layers.38.mlp.experts.159.gate_proj", "model.layers.38.mlp.experts.0.up_proj", "model.layers.38.mlp.experts.1.up_proj", "model.layers.38.mlp.experts.2.up_proj", "model.layers.38.mlp.experts.3.up_proj", "model.layers.38.mlp.experts.4.up_proj", "model.layers.38.mlp.experts.5.up_proj", "model.layers.38.mlp.experts.6.up_proj", "model.layers.38.mlp.experts.7.up_proj", "model.layers.38.mlp.experts.8.up_proj", "model.layers.38.mlp.experts.9.up_proj", "model.layers.38.mlp.experts.10.up_proj", "model.layers.38.mlp.experts.11.up_proj", "model.layers.38.mlp.experts.12.up_proj", "model.layers.38.mlp.experts.13.up_proj", "model.layers.38.mlp.experts.14.up_proj", "model.layers.38.mlp.experts.15.up_proj", "model.layers.38.mlp.experts.16.up_proj", "model.layers.38.mlp.experts.17.up_proj", "model.layers.38.mlp.experts.18.up_proj", "model.layers.38.mlp.experts.19.up_proj", "model.layers.38.mlp.experts.20.up_proj", "model.layers.38.mlp.experts.21.up_proj", "model.layers.38.mlp.experts.22.up_proj", "model.layers.38.mlp.experts.23.up_proj", "model.layers.38.mlp.experts.24.up_proj", "model.layers.38.mlp.experts.25.up_proj", "model.layers.38.mlp.experts.26.up_proj", "model.layers.38.mlp.experts.27.up_proj", "model.layers.38.mlp.experts.28.up_proj", "model.layers.38.mlp.experts.29.up_proj", "model.layers.38.mlp.experts.30.up_proj", "model.layers.38.mlp.experts.31.up_proj", "model.layers.38.mlp.experts.32.up_proj", "model.layers.38.mlp.experts.33.up_proj", "model.layers.38.mlp.experts.34.up_proj", "model.layers.38.mlp.experts.35.up_proj", "model.layers.38.mlp.experts.36.up_proj", "model.layers.38.mlp.experts.37.up_proj", "model.layers.38.mlp.experts.38.up_proj", "model.layers.38.mlp.experts.39.up_proj", "model.layers.38.mlp.experts.40.up_proj", "model.layers.38.mlp.experts.41.up_proj", "model.layers.38.mlp.experts.42.up_proj", "model.layers.38.mlp.experts.43.up_proj", "model.layers.38.mlp.experts.44.up_proj", "model.layers.38.mlp.experts.45.up_proj", "model.layers.38.mlp.experts.46.up_proj", "model.layers.38.mlp.experts.47.up_proj", "model.layers.38.mlp.experts.48.up_proj", "model.layers.38.mlp.experts.49.up_proj", "model.layers.38.mlp.experts.50.up_proj", "model.layers.38.mlp.experts.51.up_proj", "model.layers.38.mlp.experts.52.up_proj", "model.layers.38.mlp.experts.53.up_proj", "model.layers.38.mlp.experts.54.up_proj", "model.layers.38.mlp.experts.55.up_proj", "model.layers.38.mlp.experts.56.up_proj", "model.layers.38.mlp.experts.57.up_proj", "model.layers.38.mlp.experts.58.up_proj", "model.layers.38.mlp.experts.59.up_proj", "model.layers.38.mlp.experts.60.up_proj", "model.layers.38.mlp.experts.61.up_proj", "model.layers.38.mlp.experts.62.up_proj", "model.layers.38.mlp.experts.63.up_proj", "model.layers.38.mlp.experts.64.up_proj", "model.layers.38.mlp.experts.65.up_proj", "model.layers.38.mlp.experts.66.up_proj", "model.layers.38.mlp.experts.67.up_proj", "model.layers.38.mlp.experts.68.up_proj", "model.layers.38.mlp.experts.69.up_proj", "model.layers.38.mlp.experts.70.up_proj", "model.layers.38.mlp.experts.71.up_proj", "model.layers.38.mlp.experts.72.up_proj", "model.layers.38.mlp.experts.73.up_proj", "model.layers.38.mlp.experts.74.up_proj", "model.layers.38.mlp.experts.75.up_proj", "model.layers.38.mlp.experts.76.up_proj", "model.layers.38.mlp.experts.77.up_proj", "model.layers.38.mlp.experts.78.up_proj", "model.layers.38.mlp.experts.79.up_proj", "model.layers.38.mlp.experts.80.up_proj", "model.layers.38.mlp.experts.81.up_proj", "model.layers.38.mlp.experts.82.up_proj", "model.layers.38.mlp.experts.83.up_proj", "model.layers.38.mlp.experts.84.up_proj", "model.layers.38.mlp.experts.85.up_proj", "model.layers.38.mlp.experts.86.up_proj", "model.layers.38.mlp.experts.87.up_proj", "model.layers.38.mlp.experts.88.up_proj", "model.layers.38.mlp.experts.89.up_proj", "model.layers.38.mlp.experts.90.up_proj", "model.layers.38.mlp.experts.91.up_proj", "model.layers.38.mlp.experts.92.up_proj", "model.layers.38.mlp.experts.93.up_proj", "model.layers.38.mlp.experts.94.up_proj", "model.layers.38.mlp.experts.95.up_proj", "model.layers.38.mlp.experts.96.up_proj", "model.layers.38.mlp.experts.97.up_proj", "model.layers.38.mlp.experts.98.up_proj", "model.layers.38.mlp.experts.99.up_proj", "model.layers.38.mlp.experts.100.up_proj", "model.layers.38.mlp.experts.101.up_proj", "model.layers.38.mlp.experts.102.up_proj", "model.layers.38.mlp.experts.103.up_proj", "model.layers.38.mlp.experts.104.up_proj", "model.layers.38.mlp.experts.105.up_proj", "model.layers.38.mlp.experts.106.up_proj", "model.layers.38.mlp.experts.107.up_proj", "model.layers.38.mlp.experts.108.up_proj", "model.layers.38.mlp.experts.109.up_proj", "model.layers.38.mlp.experts.110.up_proj", "model.layers.38.mlp.experts.111.up_proj", "model.layers.38.mlp.experts.112.up_proj", "model.layers.38.mlp.experts.113.up_proj", "model.layers.38.mlp.experts.114.up_proj", "model.layers.38.mlp.experts.115.up_proj", "model.layers.38.mlp.experts.116.up_proj", "model.layers.38.mlp.experts.117.up_proj", "model.layers.38.mlp.experts.118.up_proj", "model.layers.38.mlp.experts.119.up_proj", "model.layers.38.mlp.experts.120.up_proj", "model.layers.38.mlp.experts.121.up_proj", "model.layers.38.mlp.experts.122.up_proj", "model.layers.38.mlp.experts.123.up_proj", "model.layers.38.mlp.experts.124.up_proj", "model.layers.38.mlp.experts.125.up_proj", "model.layers.38.mlp.experts.126.up_proj", "model.layers.38.mlp.experts.127.up_proj", "model.layers.38.mlp.experts.128.up_proj", "model.layers.38.mlp.experts.129.up_proj", "model.layers.38.mlp.experts.130.up_proj", "model.layers.38.mlp.experts.131.up_proj", "model.layers.38.mlp.experts.132.up_proj", "model.layers.38.mlp.experts.133.up_proj", "model.layers.38.mlp.experts.134.up_proj", "model.layers.38.mlp.experts.135.up_proj", "model.layers.38.mlp.experts.136.up_proj", "model.layers.38.mlp.experts.137.up_proj", "model.layers.38.mlp.experts.138.up_proj", "model.layers.38.mlp.experts.139.up_proj", "model.layers.38.mlp.experts.140.up_proj", "model.layers.38.mlp.experts.141.up_proj", "model.layers.38.mlp.experts.142.up_proj", "model.layers.38.mlp.experts.143.up_proj", "model.layers.38.mlp.experts.144.up_proj", "model.layers.38.mlp.experts.145.up_proj", "model.layers.38.mlp.experts.146.up_proj", "model.layers.38.mlp.experts.147.up_proj", "model.layers.38.mlp.experts.148.up_proj", "model.layers.38.mlp.experts.149.up_proj", "model.layers.38.mlp.experts.150.up_proj", "model.layers.38.mlp.experts.151.up_proj", "model.layers.38.mlp.experts.152.up_proj", "model.layers.38.mlp.experts.153.up_proj", "model.layers.38.mlp.experts.154.up_proj", "model.layers.38.mlp.experts.155.up_proj", "model.layers.38.mlp.experts.156.up_proj", "model.layers.38.mlp.experts.157.up_proj", "model.layers.38.mlp.experts.158.up_proj", "model.layers.38.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -8.057970553636447e-05, "dbits": 2516582400 }, { "dkld": -0.00011419311631470815, "dbits": 5033164800 } ] }, { "idx": 230, "layers": [ "model.layers.38.mlp.experts.0.down_proj", "model.layers.38.mlp.experts.1.down_proj", "model.layers.38.mlp.experts.2.down_proj", "model.layers.38.mlp.experts.3.down_proj", "model.layers.38.mlp.experts.4.down_proj", "model.layers.38.mlp.experts.5.down_proj", "model.layers.38.mlp.experts.6.down_proj", "model.layers.38.mlp.experts.7.down_proj", "model.layers.38.mlp.experts.8.down_proj", "model.layers.38.mlp.experts.9.down_proj", "model.layers.38.mlp.experts.10.down_proj", "model.layers.38.mlp.experts.11.down_proj", "model.layers.38.mlp.experts.12.down_proj", "model.layers.38.mlp.experts.13.down_proj", "model.layers.38.mlp.experts.14.down_proj", "model.layers.38.mlp.experts.15.down_proj", "model.layers.38.mlp.experts.16.down_proj", "model.layers.38.mlp.experts.17.down_proj", "model.layers.38.mlp.experts.18.down_proj", "model.layers.38.mlp.experts.19.down_proj", "model.layers.38.mlp.experts.20.down_proj", "model.layers.38.mlp.experts.21.down_proj", "model.layers.38.mlp.experts.22.down_proj", "model.layers.38.mlp.experts.23.down_proj", "model.layers.38.mlp.experts.24.down_proj", "model.layers.38.mlp.experts.25.down_proj", "model.layers.38.mlp.experts.26.down_proj", "model.layers.38.mlp.experts.27.down_proj", "model.layers.38.mlp.experts.28.down_proj", "model.layers.38.mlp.experts.29.down_proj", "model.layers.38.mlp.experts.30.down_proj", "model.layers.38.mlp.experts.31.down_proj", "model.layers.38.mlp.experts.32.down_proj", "model.layers.38.mlp.experts.33.down_proj", "model.layers.38.mlp.experts.34.down_proj", "model.layers.38.mlp.experts.35.down_proj", "model.layers.38.mlp.experts.36.down_proj", "model.layers.38.mlp.experts.37.down_proj", "model.layers.38.mlp.experts.38.down_proj", "model.layers.38.mlp.experts.39.down_proj", "model.layers.38.mlp.experts.40.down_proj", "model.layers.38.mlp.experts.41.down_proj", "model.layers.38.mlp.experts.42.down_proj", "model.layers.38.mlp.experts.43.down_proj", "model.layers.38.mlp.experts.44.down_proj", "model.layers.38.mlp.experts.45.down_proj", "model.layers.38.mlp.experts.46.down_proj", "model.layers.38.mlp.experts.47.down_proj", "model.layers.38.mlp.experts.48.down_proj", "model.layers.38.mlp.experts.49.down_proj", "model.layers.38.mlp.experts.50.down_proj", "model.layers.38.mlp.experts.51.down_proj", "model.layers.38.mlp.experts.52.down_proj", "model.layers.38.mlp.experts.53.down_proj", "model.layers.38.mlp.experts.54.down_proj", "model.layers.38.mlp.experts.55.down_proj", "model.layers.38.mlp.experts.56.down_proj", "model.layers.38.mlp.experts.57.down_proj", "model.layers.38.mlp.experts.58.down_proj", "model.layers.38.mlp.experts.59.down_proj", "model.layers.38.mlp.experts.60.down_proj", "model.layers.38.mlp.experts.61.down_proj", "model.layers.38.mlp.experts.62.down_proj", "model.layers.38.mlp.experts.63.down_proj", "model.layers.38.mlp.experts.64.down_proj", "model.layers.38.mlp.experts.65.down_proj", "model.layers.38.mlp.experts.66.down_proj", "model.layers.38.mlp.experts.67.down_proj", "model.layers.38.mlp.experts.68.down_proj", "model.layers.38.mlp.experts.69.down_proj", "model.layers.38.mlp.experts.70.down_proj", "model.layers.38.mlp.experts.71.down_proj", "model.layers.38.mlp.experts.72.down_proj", "model.layers.38.mlp.experts.73.down_proj", "model.layers.38.mlp.experts.74.down_proj", "model.layers.38.mlp.experts.75.down_proj", "model.layers.38.mlp.experts.76.down_proj", "model.layers.38.mlp.experts.77.down_proj", "model.layers.38.mlp.experts.78.down_proj", "model.layers.38.mlp.experts.79.down_proj", "model.layers.38.mlp.experts.80.down_proj", "model.layers.38.mlp.experts.81.down_proj", "model.layers.38.mlp.experts.82.down_proj", "model.layers.38.mlp.experts.83.down_proj", "model.layers.38.mlp.experts.84.down_proj", "model.layers.38.mlp.experts.85.down_proj", "model.layers.38.mlp.experts.86.down_proj", "model.layers.38.mlp.experts.87.down_proj", "model.layers.38.mlp.experts.88.down_proj", "model.layers.38.mlp.experts.89.down_proj", "model.layers.38.mlp.experts.90.down_proj", "model.layers.38.mlp.experts.91.down_proj", "model.layers.38.mlp.experts.92.down_proj", "model.layers.38.mlp.experts.93.down_proj", "model.layers.38.mlp.experts.94.down_proj", "model.layers.38.mlp.experts.95.down_proj", "model.layers.38.mlp.experts.96.down_proj", "model.layers.38.mlp.experts.97.down_proj", "model.layers.38.mlp.experts.98.down_proj", "model.layers.38.mlp.experts.99.down_proj", "model.layers.38.mlp.experts.100.down_proj", "model.layers.38.mlp.experts.101.down_proj", "model.layers.38.mlp.experts.102.down_proj", "model.layers.38.mlp.experts.103.down_proj", "model.layers.38.mlp.experts.104.down_proj", "model.layers.38.mlp.experts.105.down_proj", "model.layers.38.mlp.experts.106.down_proj", "model.layers.38.mlp.experts.107.down_proj", "model.layers.38.mlp.experts.108.down_proj", "model.layers.38.mlp.experts.109.down_proj", "model.layers.38.mlp.experts.110.down_proj", "model.layers.38.mlp.experts.111.down_proj", "model.layers.38.mlp.experts.112.down_proj", "model.layers.38.mlp.experts.113.down_proj", "model.layers.38.mlp.experts.114.down_proj", "model.layers.38.mlp.experts.115.down_proj", "model.layers.38.mlp.experts.116.down_proj", "model.layers.38.mlp.experts.117.down_proj", "model.layers.38.mlp.experts.118.down_proj", "model.layers.38.mlp.experts.119.down_proj", "model.layers.38.mlp.experts.120.down_proj", "model.layers.38.mlp.experts.121.down_proj", "model.layers.38.mlp.experts.122.down_proj", "model.layers.38.mlp.experts.123.down_proj", "model.layers.38.mlp.experts.124.down_proj", "model.layers.38.mlp.experts.125.down_proj", "model.layers.38.mlp.experts.126.down_proj", "model.layers.38.mlp.experts.127.down_proj", "model.layers.38.mlp.experts.128.down_proj", "model.layers.38.mlp.experts.129.down_proj", "model.layers.38.mlp.experts.130.down_proj", "model.layers.38.mlp.experts.131.down_proj", "model.layers.38.mlp.experts.132.down_proj", "model.layers.38.mlp.experts.133.down_proj", "model.layers.38.mlp.experts.134.down_proj", "model.layers.38.mlp.experts.135.down_proj", "model.layers.38.mlp.experts.136.down_proj", "model.layers.38.mlp.experts.137.down_proj", "model.layers.38.mlp.experts.138.down_proj", "model.layers.38.mlp.experts.139.down_proj", "model.layers.38.mlp.experts.140.down_proj", "model.layers.38.mlp.experts.141.down_proj", "model.layers.38.mlp.experts.142.down_proj", "model.layers.38.mlp.experts.143.down_proj", "model.layers.38.mlp.experts.144.down_proj", "model.layers.38.mlp.experts.145.down_proj", "model.layers.38.mlp.experts.146.down_proj", "model.layers.38.mlp.experts.147.down_proj", "model.layers.38.mlp.experts.148.down_proj", "model.layers.38.mlp.experts.149.down_proj", "model.layers.38.mlp.experts.150.down_proj", "model.layers.38.mlp.experts.151.down_proj", "model.layers.38.mlp.experts.152.down_proj", "model.layers.38.mlp.experts.153.down_proj", "model.layers.38.mlp.experts.154.down_proj", "model.layers.38.mlp.experts.155.down_proj", "model.layers.38.mlp.experts.156.down_proj", "model.layers.38.mlp.experts.157.down_proj", "model.layers.38.mlp.experts.158.down_proj", "model.layers.38.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.0387675613164555e-05, "dbits": 1258291200 }, { "dkld": -4.1123293340205105e-05, "dbits": 2516582400 } ] }, { "idx": 231, "layers": [ "model.layers.39.self_attn.q_proj" ], "candidates": [ { "dkld": -7.699227426201036e-05, "dbits": 62914560 }, { "dkld": -5.331013817340066e-05, "dbits": 125829120 } ] }, { "idx": 232, "layers": [ "model.layers.39.self_attn.k_proj", "model.layers.39.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0004025107948109497, "dbits": 10485760 }, { "dkld": -0.0004221520386636247, "dbits": 20971520 } ] }, { "idx": 233, "layers": [ "model.layers.39.self_attn.o_proj" ], "candidates": [ { "dkld": 0.00012785305734723876, "dbits": 62914560 }, { "dkld": 5.454879719764098e-05, "dbits": 125829120 } ] }, { "idx": 234, "layers": [ "model.layers.39.mlp.shared_experts.gate_proj", "model.layers.39.mlp.shared_experts.up_proj", "model.layers.39.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.0001486854162067175, "dbits": 23592960 }, { "dkld": -0.00019448804669082095, "dbits": 47185920 } ] }, { "idx": 235, "layers": [ "model.layers.39.mlp.experts.0.gate_proj", "model.layers.39.mlp.experts.1.gate_proj", "model.layers.39.mlp.experts.2.gate_proj", "model.layers.39.mlp.experts.3.gate_proj", "model.layers.39.mlp.experts.4.gate_proj", "model.layers.39.mlp.experts.5.gate_proj", "model.layers.39.mlp.experts.6.gate_proj", "model.layers.39.mlp.experts.7.gate_proj", "model.layers.39.mlp.experts.8.gate_proj", "model.layers.39.mlp.experts.9.gate_proj", "model.layers.39.mlp.experts.10.gate_proj", "model.layers.39.mlp.experts.11.gate_proj", "model.layers.39.mlp.experts.12.gate_proj", "model.layers.39.mlp.experts.13.gate_proj", "model.layers.39.mlp.experts.14.gate_proj", "model.layers.39.mlp.experts.15.gate_proj", "model.layers.39.mlp.experts.16.gate_proj", "model.layers.39.mlp.experts.17.gate_proj", "model.layers.39.mlp.experts.18.gate_proj", "model.layers.39.mlp.experts.19.gate_proj", "model.layers.39.mlp.experts.20.gate_proj", "model.layers.39.mlp.experts.21.gate_proj", "model.layers.39.mlp.experts.22.gate_proj", "model.layers.39.mlp.experts.23.gate_proj", "model.layers.39.mlp.experts.24.gate_proj", "model.layers.39.mlp.experts.25.gate_proj", "model.layers.39.mlp.experts.26.gate_proj", "model.layers.39.mlp.experts.27.gate_proj", "model.layers.39.mlp.experts.28.gate_proj", "model.layers.39.mlp.experts.29.gate_proj", "model.layers.39.mlp.experts.30.gate_proj", "model.layers.39.mlp.experts.31.gate_proj", "model.layers.39.mlp.experts.32.gate_proj", "model.layers.39.mlp.experts.33.gate_proj", "model.layers.39.mlp.experts.34.gate_proj", "model.layers.39.mlp.experts.35.gate_proj", "model.layers.39.mlp.experts.36.gate_proj", "model.layers.39.mlp.experts.37.gate_proj", "model.layers.39.mlp.experts.38.gate_proj", "model.layers.39.mlp.experts.39.gate_proj", "model.layers.39.mlp.experts.40.gate_proj", "model.layers.39.mlp.experts.41.gate_proj", "model.layers.39.mlp.experts.42.gate_proj", "model.layers.39.mlp.experts.43.gate_proj", "model.layers.39.mlp.experts.44.gate_proj", "model.layers.39.mlp.experts.45.gate_proj", "model.layers.39.mlp.experts.46.gate_proj", "model.layers.39.mlp.experts.47.gate_proj", "model.layers.39.mlp.experts.48.gate_proj", "model.layers.39.mlp.experts.49.gate_proj", "model.layers.39.mlp.experts.50.gate_proj", "model.layers.39.mlp.experts.51.gate_proj", "model.layers.39.mlp.experts.52.gate_proj", "model.layers.39.mlp.experts.53.gate_proj", "model.layers.39.mlp.experts.54.gate_proj", "model.layers.39.mlp.experts.55.gate_proj", "model.layers.39.mlp.experts.56.gate_proj", "model.layers.39.mlp.experts.57.gate_proj", "model.layers.39.mlp.experts.58.gate_proj", "model.layers.39.mlp.experts.59.gate_proj", "model.layers.39.mlp.experts.60.gate_proj", "model.layers.39.mlp.experts.61.gate_proj", "model.layers.39.mlp.experts.62.gate_proj", "model.layers.39.mlp.experts.63.gate_proj", "model.layers.39.mlp.experts.64.gate_proj", "model.layers.39.mlp.experts.65.gate_proj", "model.layers.39.mlp.experts.66.gate_proj", "model.layers.39.mlp.experts.67.gate_proj", "model.layers.39.mlp.experts.68.gate_proj", "model.layers.39.mlp.experts.69.gate_proj", "model.layers.39.mlp.experts.70.gate_proj", "model.layers.39.mlp.experts.71.gate_proj", "model.layers.39.mlp.experts.72.gate_proj", "model.layers.39.mlp.experts.73.gate_proj", "model.layers.39.mlp.experts.74.gate_proj", "model.layers.39.mlp.experts.75.gate_proj", "model.layers.39.mlp.experts.76.gate_proj", "model.layers.39.mlp.experts.77.gate_proj", "model.layers.39.mlp.experts.78.gate_proj", "model.layers.39.mlp.experts.79.gate_proj", "model.layers.39.mlp.experts.80.gate_proj", "model.layers.39.mlp.experts.81.gate_proj", "model.layers.39.mlp.experts.82.gate_proj", "model.layers.39.mlp.experts.83.gate_proj", "model.layers.39.mlp.experts.84.gate_proj", "model.layers.39.mlp.experts.85.gate_proj", "model.layers.39.mlp.experts.86.gate_proj", "model.layers.39.mlp.experts.87.gate_proj", "model.layers.39.mlp.experts.88.gate_proj", "model.layers.39.mlp.experts.89.gate_proj", "model.layers.39.mlp.experts.90.gate_proj", "model.layers.39.mlp.experts.91.gate_proj", "model.layers.39.mlp.experts.92.gate_proj", "model.layers.39.mlp.experts.93.gate_proj", "model.layers.39.mlp.experts.94.gate_proj", "model.layers.39.mlp.experts.95.gate_proj", "model.layers.39.mlp.experts.96.gate_proj", "model.layers.39.mlp.experts.97.gate_proj", "model.layers.39.mlp.experts.98.gate_proj", "model.layers.39.mlp.experts.99.gate_proj", "model.layers.39.mlp.experts.100.gate_proj", "model.layers.39.mlp.experts.101.gate_proj", "model.layers.39.mlp.experts.102.gate_proj", "model.layers.39.mlp.experts.103.gate_proj", "model.layers.39.mlp.experts.104.gate_proj", "model.layers.39.mlp.experts.105.gate_proj", "model.layers.39.mlp.experts.106.gate_proj", "model.layers.39.mlp.experts.107.gate_proj", "model.layers.39.mlp.experts.108.gate_proj", "model.layers.39.mlp.experts.109.gate_proj", "model.layers.39.mlp.experts.110.gate_proj", "model.layers.39.mlp.experts.111.gate_proj", "model.layers.39.mlp.experts.112.gate_proj", "model.layers.39.mlp.experts.113.gate_proj", "model.layers.39.mlp.experts.114.gate_proj", "model.layers.39.mlp.experts.115.gate_proj", "model.layers.39.mlp.experts.116.gate_proj", "model.layers.39.mlp.experts.117.gate_proj", "model.layers.39.mlp.experts.118.gate_proj", "model.layers.39.mlp.experts.119.gate_proj", "model.layers.39.mlp.experts.120.gate_proj", "model.layers.39.mlp.experts.121.gate_proj", "model.layers.39.mlp.experts.122.gate_proj", "model.layers.39.mlp.experts.123.gate_proj", "model.layers.39.mlp.experts.124.gate_proj", "model.layers.39.mlp.experts.125.gate_proj", "model.layers.39.mlp.experts.126.gate_proj", "model.layers.39.mlp.experts.127.gate_proj", "model.layers.39.mlp.experts.128.gate_proj", "model.layers.39.mlp.experts.129.gate_proj", "model.layers.39.mlp.experts.130.gate_proj", "model.layers.39.mlp.experts.131.gate_proj", "model.layers.39.mlp.experts.132.gate_proj", "model.layers.39.mlp.experts.133.gate_proj", "model.layers.39.mlp.experts.134.gate_proj", "model.layers.39.mlp.experts.135.gate_proj", "model.layers.39.mlp.experts.136.gate_proj", "model.layers.39.mlp.experts.137.gate_proj", "model.layers.39.mlp.experts.138.gate_proj", "model.layers.39.mlp.experts.139.gate_proj", "model.layers.39.mlp.experts.140.gate_proj", "model.layers.39.mlp.experts.141.gate_proj", "model.layers.39.mlp.experts.142.gate_proj", "model.layers.39.mlp.experts.143.gate_proj", "model.layers.39.mlp.experts.144.gate_proj", "model.layers.39.mlp.experts.145.gate_proj", "model.layers.39.mlp.experts.146.gate_proj", "model.layers.39.mlp.experts.147.gate_proj", "model.layers.39.mlp.experts.148.gate_proj", "model.layers.39.mlp.experts.149.gate_proj", "model.layers.39.mlp.experts.150.gate_proj", "model.layers.39.mlp.experts.151.gate_proj", "model.layers.39.mlp.experts.152.gate_proj", "model.layers.39.mlp.experts.153.gate_proj", "model.layers.39.mlp.experts.154.gate_proj", "model.layers.39.mlp.experts.155.gate_proj", "model.layers.39.mlp.experts.156.gate_proj", "model.layers.39.mlp.experts.157.gate_proj", "model.layers.39.mlp.experts.158.gate_proj", "model.layers.39.mlp.experts.159.gate_proj", "model.layers.39.mlp.experts.0.up_proj", "model.layers.39.mlp.experts.1.up_proj", "model.layers.39.mlp.experts.2.up_proj", "model.layers.39.mlp.experts.3.up_proj", "model.layers.39.mlp.experts.4.up_proj", "model.layers.39.mlp.experts.5.up_proj", "model.layers.39.mlp.experts.6.up_proj", "model.layers.39.mlp.experts.7.up_proj", "model.layers.39.mlp.experts.8.up_proj", "model.layers.39.mlp.experts.9.up_proj", "model.layers.39.mlp.experts.10.up_proj", "model.layers.39.mlp.experts.11.up_proj", "model.layers.39.mlp.experts.12.up_proj", "model.layers.39.mlp.experts.13.up_proj", "model.layers.39.mlp.experts.14.up_proj", "model.layers.39.mlp.experts.15.up_proj", "model.layers.39.mlp.experts.16.up_proj", "model.layers.39.mlp.experts.17.up_proj", "model.layers.39.mlp.experts.18.up_proj", "model.layers.39.mlp.experts.19.up_proj", "model.layers.39.mlp.experts.20.up_proj", "model.layers.39.mlp.experts.21.up_proj", "model.layers.39.mlp.experts.22.up_proj", "model.layers.39.mlp.experts.23.up_proj", "model.layers.39.mlp.experts.24.up_proj", "model.layers.39.mlp.experts.25.up_proj", "model.layers.39.mlp.experts.26.up_proj", "model.layers.39.mlp.experts.27.up_proj", "model.layers.39.mlp.experts.28.up_proj", "model.layers.39.mlp.experts.29.up_proj", "model.layers.39.mlp.experts.30.up_proj", "model.layers.39.mlp.experts.31.up_proj", "model.layers.39.mlp.experts.32.up_proj", "model.layers.39.mlp.experts.33.up_proj", "model.layers.39.mlp.experts.34.up_proj", "model.layers.39.mlp.experts.35.up_proj", "model.layers.39.mlp.experts.36.up_proj", "model.layers.39.mlp.experts.37.up_proj", "model.layers.39.mlp.experts.38.up_proj", "model.layers.39.mlp.experts.39.up_proj", "model.layers.39.mlp.experts.40.up_proj", "model.layers.39.mlp.experts.41.up_proj", "model.layers.39.mlp.experts.42.up_proj", "model.layers.39.mlp.experts.43.up_proj", "model.layers.39.mlp.experts.44.up_proj", "model.layers.39.mlp.experts.45.up_proj", "model.layers.39.mlp.experts.46.up_proj", "model.layers.39.mlp.experts.47.up_proj", "model.layers.39.mlp.experts.48.up_proj", "model.layers.39.mlp.experts.49.up_proj", "model.layers.39.mlp.experts.50.up_proj", "model.layers.39.mlp.experts.51.up_proj", "model.layers.39.mlp.experts.52.up_proj", "model.layers.39.mlp.experts.53.up_proj", "model.layers.39.mlp.experts.54.up_proj", "model.layers.39.mlp.experts.55.up_proj", "model.layers.39.mlp.experts.56.up_proj", "model.layers.39.mlp.experts.57.up_proj", "model.layers.39.mlp.experts.58.up_proj", "model.layers.39.mlp.experts.59.up_proj", "model.layers.39.mlp.experts.60.up_proj", "model.layers.39.mlp.experts.61.up_proj", "model.layers.39.mlp.experts.62.up_proj", "model.layers.39.mlp.experts.63.up_proj", "model.layers.39.mlp.experts.64.up_proj", "model.layers.39.mlp.experts.65.up_proj", "model.layers.39.mlp.experts.66.up_proj", "model.layers.39.mlp.experts.67.up_proj", "model.layers.39.mlp.experts.68.up_proj", "model.layers.39.mlp.experts.69.up_proj", "model.layers.39.mlp.experts.70.up_proj", "model.layers.39.mlp.experts.71.up_proj", "model.layers.39.mlp.experts.72.up_proj", "model.layers.39.mlp.experts.73.up_proj", "model.layers.39.mlp.experts.74.up_proj", "model.layers.39.mlp.experts.75.up_proj", "model.layers.39.mlp.experts.76.up_proj", "model.layers.39.mlp.experts.77.up_proj", "model.layers.39.mlp.experts.78.up_proj", "model.layers.39.mlp.experts.79.up_proj", "model.layers.39.mlp.experts.80.up_proj", "model.layers.39.mlp.experts.81.up_proj", "model.layers.39.mlp.experts.82.up_proj", "model.layers.39.mlp.experts.83.up_proj", "model.layers.39.mlp.experts.84.up_proj", "model.layers.39.mlp.experts.85.up_proj", "model.layers.39.mlp.experts.86.up_proj", "model.layers.39.mlp.experts.87.up_proj", "model.layers.39.mlp.experts.88.up_proj", "model.layers.39.mlp.experts.89.up_proj", "model.layers.39.mlp.experts.90.up_proj", "model.layers.39.mlp.experts.91.up_proj", "model.layers.39.mlp.experts.92.up_proj", "model.layers.39.mlp.experts.93.up_proj", "model.layers.39.mlp.experts.94.up_proj", "model.layers.39.mlp.experts.95.up_proj", "model.layers.39.mlp.experts.96.up_proj", "model.layers.39.mlp.experts.97.up_proj", "model.layers.39.mlp.experts.98.up_proj", "model.layers.39.mlp.experts.99.up_proj", "model.layers.39.mlp.experts.100.up_proj", "model.layers.39.mlp.experts.101.up_proj", "model.layers.39.mlp.experts.102.up_proj", "model.layers.39.mlp.experts.103.up_proj", "model.layers.39.mlp.experts.104.up_proj", "model.layers.39.mlp.experts.105.up_proj", "model.layers.39.mlp.experts.106.up_proj", "model.layers.39.mlp.experts.107.up_proj", "model.layers.39.mlp.experts.108.up_proj", "model.layers.39.mlp.experts.109.up_proj", "model.layers.39.mlp.experts.110.up_proj", "model.layers.39.mlp.experts.111.up_proj", "model.layers.39.mlp.experts.112.up_proj", "model.layers.39.mlp.experts.113.up_proj", "model.layers.39.mlp.experts.114.up_proj", "model.layers.39.mlp.experts.115.up_proj", "model.layers.39.mlp.experts.116.up_proj", "model.layers.39.mlp.experts.117.up_proj", "model.layers.39.mlp.experts.118.up_proj", "model.layers.39.mlp.experts.119.up_proj", "model.layers.39.mlp.experts.120.up_proj", "model.layers.39.mlp.experts.121.up_proj", "model.layers.39.mlp.experts.122.up_proj", "model.layers.39.mlp.experts.123.up_proj", "model.layers.39.mlp.experts.124.up_proj", "model.layers.39.mlp.experts.125.up_proj", "model.layers.39.mlp.experts.126.up_proj", "model.layers.39.mlp.experts.127.up_proj", "model.layers.39.mlp.experts.128.up_proj", "model.layers.39.mlp.experts.129.up_proj", "model.layers.39.mlp.experts.130.up_proj", "model.layers.39.mlp.experts.131.up_proj", "model.layers.39.mlp.experts.132.up_proj", "model.layers.39.mlp.experts.133.up_proj", "model.layers.39.mlp.experts.134.up_proj", "model.layers.39.mlp.experts.135.up_proj", "model.layers.39.mlp.experts.136.up_proj", "model.layers.39.mlp.experts.137.up_proj", "model.layers.39.mlp.experts.138.up_proj", "model.layers.39.mlp.experts.139.up_proj", "model.layers.39.mlp.experts.140.up_proj", "model.layers.39.mlp.experts.141.up_proj", "model.layers.39.mlp.experts.142.up_proj", "model.layers.39.mlp.experts.143.up_proj", "model.layers.39.mlp.experts.144.up_proj", "model.layers.39.mlp.experts.145.up_proj", "model.layers.39.mlp.experts.146.up_proj", "model.layers.39.mlp.experts.147.up_proj", "model.layers.39.mlp.experts.148.up_proj", "model.layers.39.mlp.experts.149.up_proj", "model.layers.39.mlp.experts.150.up_proj", "model.layers.39.mlp.experts.151.up_proj", "model.layers.39.mlp.experts.152.up_proj", "model.layers.39.mlp.experts.153.up_proj", "model.layers.39.mlp.experts.154.up_proj", "model.layers.39.mlp.experts.155.up_proj", "model.layers.39.mlp.experts.156.up_proj", "model.layers.39.mlp.experts.157.up_proj", "model.layers.39.mlp.experts.158.up_proj", "model.layers.39.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.2517733052371545e-05, "dbits": 2516582400 }, { "dkld": -2.5416770949958714e-05, "dbits": 5033164800 } ] }, { "idx": 236, "layers": [ "model.layers.39.mlp.experts.0.down_proj", "model.layers.39.mlp.experts.1.down_proj", "model.layers.39.mlp.experts.2.down_proj", "model.layers.39.mlp.experts.3.down_proj", "model.layers.39.mlp.experts.4.down_proj", "model.layers.39.mlp.experts.5.down_proj", "model.layers.39.mlp.experts.6.down_proj", "model.layers.39.mlp.experts.7.down_proj", "model.layers.39.mlp.experts.8.down_proj", "model.layers.39.mlp.experts.9.down_proj", "model.layers.39.mlp.experts.10.down_proj", "model.layers.39.mlp.experts.11.down_proj", "model.layers.39.mlp.experts.12.down_proj", "model.layers.39.mlp.experts.13.down_proj", "model.layers.39.mlp.experts.14.down_proj", "model.layers.39.mlp.experts.15.down_proj", "model.layers.39.mlp.experts.16.down_proj", "model.layers.39.mlp.experts.17.down_proj", "model.layers.39.mlp.experts.18.down_proj", "model.layers.39.mlp.experts.19.down_proj", "model.layers.39.mlp.experts.20.down_proj", "model.layers.39.mlp.experts.21.down_proj", "model.layers.39.mlp.experts.22.down_proj", "model.layers.39.mlp.experts.23.down_proj", "model.layers.39.mlp.experts.24.down_proj", "model.layers.39.mlp.experts.25.down_proj", "model.layers.39.mlp.experts.26.down_proj", "model.layers.39.mlp.experts.27.down_proj", "model.layers.39.mlp.experts.28.down_proj", "model.layers.39.mlp.experts.29.down_proj", "model.layers.39.mlp.experts.30.down_proj", "model.layers.39.mlp.experts.31.down_proj", "model.layers.39.mlp.experts.32.down_proj", "model.layers.39.mlp.experts.33.down_proj", "model.layers.39.mlp.experts.34.down_proj", "model.layers.39.mlp.experts.35.down_proj", "model.layers.39.mlp.experts.36.down_proj", "model.layers.39.mlp.experts.37.down_proj", "model.layers.39.mlp.experts.38.down_proj", "model.layers.39.mlp.experts.39.down_proj", "model.layers.39.mlp.experts.40.down_proj", "model.layers.39.mlp.experts.41.down_proj", "model.layers.39.mlp.experts.42.down_proj", "model.layers.39.mlp.experts.43.down_proj", "model.layers.39.mlp.experts.44.down_proj", "model.layers.39.mlp.experts.45.down_proj", "model.layers.39.mlp.experts.46.down_proj", "model.layers.39.mlp.experts.47.down_proj", "model.layers.39.mlp.experts.48.down_proj", "model.layers.39.mlp.experts.49.down_proj", "model.layers.39.mlp.experts.50.down_proj", "model.layers.39.mlp.experts.51.down_proj", "model.layers.39.mlp.experts.52.down_proj", "model.layers.39.mlp.experts.53.down_proj", "model.layers.39.mlp.experts.54.down_proj", "model.layers.39.mlp.experts.55.down_proj", "model.layers.39.mlp.experts.56.down_proj", "model.layers.39.mlp.experts.57.down_proj", "model.layers.39.mlp.experts.58.down_proj", "model.layers.39.mlp.experts.59.down_proj", "model.layers.39.mlp.experts.60.down_proj", "model.layers.39.mlp.experts.61.down_proj", "model.layers.39.mlp.experts.62.down_proj", "model.layers.39.mlp.experts.63.down_proj", "model.layers.39.mlp.experts.64.down_proj", "model.layers.39.mlp.experts.65.down_proj", "model.layers.39.mlp.experts.66.down_proj", "model.layers.39.mlp.experts.67.down_proj", "model.layers.39.mlp.experts.68.down_proj", "model.layers.39.mlp.experts.69.down_proj", "model.layers.39.mlp.experts.70.down_proj", "model.layers.39.mlp.experts.71.down_proj", "model.layers.39.mlp.experts.72.down_proj", "model.layers.39.mlp.experts.73.down_proj", "model.layers.39.mlp.experts.74.down_proj", "model.layers.39.mlp.experts.75.down_proj", "model.layers.39.mlp.experts.76.down_proj", "model.layers.39.mlp.experts.77.down_proj", "model.layers.39.mlp.experts.78.down_proj", "model.layers.39.mlp.experts.79.down_proj", "model.layers.39.mlp.experts.80.down_proj", "model.layers.39.mlp.experts.81.down_proj", "model.layers.39.mlp.experts.82.down_proj", "model.layers.39.mlp.experts.83.down_proj", "model.layers.39.mlp.experts.84.down_proj", "model.layers.39.mlp.experts.85.down_proj", "model.layers.39.mlp.experts.86.down_proj", "model.layers.39.mlp.experts.87.down_proj", "model.layers.39.mlp.experts.88.down_proj", "model.layers.39.mlp.experts.89.down_proj", "model.layers.39.mlp.experts.90.down_proj", "model.layers.39.mlp.experts.91.down_proj", "model.layers.39.mlp.experts.92.down_proj", "model.layers.39.mlp.experts.93.down_proj", "model.layers.39.mlp.experts.94.down_proj", "model.layers.39.mlp.experts.95.down_proj", "model.layers.39.mlp.experts.96.down_proj", "model.layers.39.mlp.experts.97.down_proj", "model.layers.39.mlp.experts.98.down_proj", "model.layers.39.mlp.experts.99.down_proj", "model.layers.39.mlp.experts.100.down_proj", "model.layers.39.mlp.experts.101.down_proj", "model.layers.39.mlp.experts.102.down_proj", "model.layers.39.mlp.experts.103.down_proj", "model.layers.39.mlp.experts.104.down_proj", "model.layers.39.mlp.experts.105.down_proj", "model.layers.39.mlp.experts.106.down_proj", "model.layers.39.mlp.experts.107.down_proj", "model.layers.39.mlp.experts.108.down_proj", "model.layers.39.mlp.experts.109.down_proj", "model.layers.39.mlp.experts.110.down_proj", "model.layers.39.mlp.experts.111.down_proj", "model.layers.39.mlp.experts.112.down_proj", "model.layers.39.mlp.experts.113.down_proj", "model.layers.39.mlp.experts.114.down_proj", "model.layers.39.mlp.experts.115.down_proj", "model.layers.39.mlp.experts.116.down_proj", "model.layers.39.mlp.experts.117.down_proj", "model.layers.39.mlp.experts.118.down_proj", "model.layers.39.mlp.experts.119.down_proj", "model.layers.39.mlp.experts.120.down_proj", "model.layers.39.mlp.experts.121.down_proj", "model.layers.39.mlp.experts.122.down_proj", "model.layers.39.mlp.experts.123.down_proj", "model.layers.39.mlp.experts.124.down_proj", "model.layers.39.mlp.experts.125.down_proj", "model.layers.39.mlp.experts.126.down_proj", "model.layers.39.mlp.experts.127.down_proj", "model.layers.39.mlp.experts.128.down_proj", "model.layers.39.mlp.experts.129.down_proj", "model.layers.39.mlp.experts.130.down_proj", "model.layers.39.mlp.experts.131.down_proj", "model.layers.39.mlp.experts.132.down_proj", "model.layers.39.mlp.experts.133.down_proj", "model.layers.39.mlp.experts.134.down_proj", "model.layers.39.mlp.experts.135.down_proj", "model.layers.39.mlp.experts.136.down_proj", "model.layers.39.mlp.experts.137.down_proj", "model.layers.39.mlp.experts.138.down_proj", "model.layers.39.mlp.experts.139.down_proj", "model.layers.39.mlp.experts.140.down_proj", "model.layers.39.mlp.experts.141.down_proj", "model.layers.39.mlp.experts.142.down_proj", "model.layers.39.mlp.experts.143.down_proj", "model.layers.39.mlp.experts.144.down_proj", "model.layers.39.mlp.experts.145.down_proj", "model.layers.39.mlp.experts.146.down_proj", "model.layers.39.mlp.experts.147.down_proj", "model.layers.39.mlp.experts.148.down_proj", "model.layers.39.mlp.experts.149.down_proj", "model.layers.39.mlp.experts.150.down_proj", "model.layers.39.mlp.experts.151.down_proj", "model.layers.39.mlp.experts.152.down_proj", "model.layers.39.mlp.experts.153.down_proj", "model.layers.39.mlp.experts.154.down_proj", "model.layers.39.mlp.experts.155.down_proj", "model.layers.39.mlp.experts.156.down_proj", "model.layers.39.mlp.experts.157.down_proj", "model.layers.39.mlp.experts.158.down_proj", "model.layers.39.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.3475598320363564e-05, "dbits": 1258291200 }, { "dkld": -2.7550989761947198e-05, "dbits": 2516582400 } ] }, { "idx": 237, "layers": [ "model.layers.40.self_attn.q_proj" ], "candidates": [ { "dkld": -1.1326349340378544e-05, "dbits": 62914560 }, { "dkld": -1.6247853636741638e-05, "dbits": 125829120 } ] }, { "idx": 238, "layers": [ "model.layers.40.self_attn.k_proj", "model.layers.40.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0001803796272724853, "dbits": 10485760 }, { "dkld": -0.00011054326314479009, "dbits": 20971520 } ] }, { "idx": 239, "layers": [ "model.layers.40.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00014479490928351844, "dbits": 62914560 }, { "dkld": -0.00020684762857854297, "dbits": 125829120 } ] }, { "idx": 240, "layers": [ "model.layers.40.mlp.shared_experts.gate_proj", "model.layers.40.mlp.shared_experts.up_proj", "model.layers.40.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -7.342621684074298e-05, "dbits": 23592960 }, { "dkld": -9.552435949444771e-05, "dbits": 47185920 } ] }, { "idx": 241, "layers": [ "model.layers.40.mlp.experts.0.gate_proj", "model.layers.40.mlp.experts.1.gate_proj", "model.layers.40.mlp.experts.2.gate_proj", "model.layers.40.mlp.experts.3.gate_proj", "model.layers.40.mlp.experts.4.gate_proj", "model.layers.40.mlp.experts.5.gate_proj", "model.layers.40.mlp.experts.6.gate_proj", "model.layers.40.mlp.experts.7.gate_proj", "model.layers.40.mlp.experts.8.gate_proj", "model.layers.40.mlp.experts.9.gate_proj", "model.layers.40.mlp.experts.10.gate_proj", "model.layers.40.mlp.experts.11.gate_proj", "model.layers.40.mlp.experts.12.gate_proj", "model.layers.40.mlp.experts.13.gate_proj", "model.layers.40.mlp.experts.14.gate_proj", "model.layers.40.mlp.experts.15.gate_proj", "model.layers.40.mlp.experts.16.gate_proj", "model.layers.40.mlp.experts.17.gate_proj", "model.layers.40.mlp.experts.18.gate_proj", "model.layers.40.mlp.experts.19.gate_proj", "model.layers.40.mlp.experts.20.gate_proj", "model.layers.40.mlp.experts.21.gate_proj", "model.layers.40.mlp.experts.22.gate_proj", "model.layers.40.mlp.experts.23.gate_proj", "model.layers.40.mlp.experts.24.gate_proj", "model.layers.40.mlp.experts.25.gate_proj", "model.layers.40.mlp.experts.26.gate_proj", "model.layers.40.mlp.experts.27.gate_proj", "model.layers.40.mlp.experts.28.gate_proj", "model.layers.40.mlp.experts.29.gate_proj", "model.layers.40.mlp.experts.30.gate_proj", "model.layers.40.mlp.experts.31.gate_proj", "model.layers.40.mlp.experts.32.gate_proj", "model.layers.40.mlp.experts.33.gate_proj", "model.layers.40.mlp.experts.34.gate_proj", "model.layers.40.mlp.experts.35.gate_proj", "model.layers.40.mlp.experts.36.gate_proj", "model.layers.40.mlp.experts.37.gate_proj", "model.layers.40.mlp.experts.38.gate_proj", "model.layers.40.mlp.experts.39.gate_proj", "model.layers.40.mlp.experts.40.gate_proj", "model.layers.40.mlp.experts.41.gate_proj", "model.layers.40.mlp.experts.42.gate_proj", "model.layers.40.mlp.experts.43.gate_proj", "model.layers.40.mlp.experts.44.gate_proj", "model.layers.40.mlp.experts.45.gate_proj", "model.layers.40.mlp.experts.46.gate_proj", "model.layers.40.mlp.experts.47.gate_proj", "model.layers.40.mlp.experts.48.gate_proj", "model.layers.40.mlp.experts.49.gate_proj", "model.layers.40.mlp.experts.50.gate_proj", "model.layers.40.mlp.experts.51.gate_proj", "model.layers.40.mlp.experts.52.gate_proj", "model.layers.40.mlp.experts.53.gate_proj", "model.layers.40.mlp.experts.54.gate_proj", "model.layers.40.mlp.experts.55.gate_proj", "model.layers.40.mlp.experts.56.gate_proj", "model.layers.40.mlp.experts.57.gate_proj", "model.layers.40.mlp.experts.58.gate_proj", "model.layers.40.mlp.experts.59.gate_proj", "model.layers.40.mlp.experts.60.gate_proj", "model.layers.40.mlp.experts.61.gate_proj", "model.layers.40.mlp.experts.62.gate_proj", "model.layers.40.mlp.experts.63.gate_proj", "model.layers.40.mlp.experts.64.gate_proj", "model.layers.40.mlp.experts.65.gate_proj", "model.layers.40.mlp.experts.66.gate_proj", "model.layers.40.mlp.experts.67.gate_proj", "model.layers.40.mlp.experts.68.gate_proj", "model.layers.40.mlp.experts.69.gate_proj", "model.layers.40.mlp.experts.70.gate_proj", "model.layers.40.mlp.experts.71.gate_proj", "model.layers.40.mlp.experts.72.gate_proj", "model.layers.40.mlp.experts.73.gate_proj", "model.layers.40.mlp.experts.74.gate_proj", "model.layers.40.mlp.experts.75.gate_proj", "model.layers.40.mlp.experts.76.gate_proj", "model.layers.40.mlp.experts.77.gate_proj", "model.layers.40.mlp.experts.78.gate_proj", "model.layers.40.mlp.experts.79.gate_proj", "model.layers.40.mlp.experts.80.gate_proj", "model.layers.40.mlp.experts.81.gate_proj", "model.layers.40.mlp.experts.82.gate_proj", "model.layers.40.mlp.experts.83.gate_proj", "model.layers.40.mlp.experts.84.gate_proj", "model.layers.40.mlp.experts.85.gate_proj", "model.layers.40.mlp.experts.86.gate_proj", "model.layers.40.mlp.experts.87.gate_proj", "model.layers.40.mlp.experts.88.gate_proj", "model.layers.40.mlp.experts.89.gate_proj", "model.layers.40.mlp.experts.90.gate_proj", "model.layers.40.mlp.experts.91.gate_proj", "model.layers.40.mlp.experts.92.gate_proj", "model.layers.40.mlp.experts.93.gate_proj", "model.layers.40.mlp.experts.94.gate_proj", "model.layers.40.mlp.experts.95.gate_proj", "model.layers.40.mlp.experts.96.gate_proj", "model.layers.40.mlp.experts.97.gate_proj", "model.layers.40.mlp.experts.98.gate_proj", "model.layers.40.mlp.experts.99.gate_proj", "model.layers.40.mlp.experts.100.gate_proj", "model.layers.40.mlp.experts.101.gate_proj", "model.layers.40.mlp.experts.102.gate_proj", "model.layers.40.mlp.experts.103.gate_proj", "model.layers.40.mlp.experts.104.gate_proj", "model.layers.40.mlp.experts.105.gate_proj", "model.layers.40.mlp.experts.106.gate_proj", "model.layers.40.mlp.experts.107.gate_proj", "model.layers.40.mlp.experts.108.gate_proj", "model.layers.40.mlp.experts.109.gate_proj", "model.layers.40.mlp.experts.110.gate_proj", "model.layers.40.mlp.experts.111.gate_proj", "model.layers.40.mlp.experts.112.gate_proj", "model.layers.40.mlp.experts.113.gate_proj", "model.layers.40.mlp.experts.114.gate_proj", "model.layers.40.mlp.experts.115.gate_proj", "model.layers.40.mlp.experts.116.gate_proj", "model.layers.40.mlp.experts.117.gate_proj", "model.layers.40.mlp.experts.118.gate_proj", "model.layers.40.mlp.experts.119.gate_proj", "model.layers.40.mlp.experts.120.gate_proj", "model.layers.40.mlp.experts.121.gate_proj", "model.layers.40.mlp.experts.122.gate_proj", "model.layers.40.mlp.experts.123.gate_proj", "model.layers.40.mlp.experts.124.gate_proj", "model.layers.40.mlp.experts.125.gate_proj", "model.layers.40.mlp.experts.126.gate_proj", "model.layers.40.mlp.experts.127.gate_proj", "model.layers.40.mlp.experts.128.gate_proj", "model.layers.40.mlp.experts.129.gate_proj", "model.layers.40.mlp.experts.130.gate_proj", "model.layers.40.mlp.experts.131.gate_proj", "model.layers.40.mlp.experts.132.gate_proj", "model.layers.40.mlp.experts.133.gate_proj", "model.layers.40.mlp.experts.134.gate_proj", "model.layers.40.mlp.experts.135.gate_proj", "model.layers.40.mlp.experts.136.gate_proj", "model.layers.40.mlp.experts.137.gate_proj", "model.layers.40.mlp.experts.138.gate_proj", "model.layers.40.mlp.experts.139.gate_proj", "model.layers.40.mlp.experts.140.gate_proj", "model.layers.40.mlp.experts.141.gate_proj", "model.layers.40.mlp.experts.142.gate_proj", "model.layers.40.mlp.experts.143.gate_proj", "model.layers.40.mlp.experts.144.gate_proj", "model.layers.40.mlp.experts.145.gate_proj", "model.layers.40.mlp.experts.146.gate_proj", "model.layers.40.mlp.experts.147.gate_proj", "model.layers.40.mlp.experts.148.gate_proj", "model.layers.40.mlp.experts.149.gate_proj", "model.layers.40.mlp.experts.150.gate_proj", "model.layers.40.mlp.experts.151.gate_proj", "model.layers.40.mlp.experts.152.gate_proj", "model.layers.40.mlp.experts.153.gate_proj", "model.layers.40.mlp.experts.154.gate_proj", "model.layers.40.mlp.experts.155.gate_proj", "model.layers.40.mlp.experts.156.gate_proj", "model.layers.40.mlp.experts.157.gate_proj", "model.layers.40.mlp.experts.158.gate_proj", "model.layers.40.mlp.experts.159.gate_proj", "model.layers.40.mlp.experts.0.up_proj", "model.layers.40.mlp.experts.1.up_proj", "model.layers.40.mlp.experts.2.up_proj", "model.layers.40.mlp.experts.3.up_proj", "model.layers.40.mlp.experts.4.up_proj", "model.layers.40.mlp.experts.5.up_proj", "model.layers.40.mlp.experts.6.up_proj", "model.layers.40.mlp.experts.7.up_proj", "model.layers.40.mlp.experts.8.up_proj", "model.layers.40.mlp.experts.9.up_proj", "model.layers.40.mlp.experts.10.up_proj", "model.layers.40.mlp.experts.11.up_proj", "model.layers.40.mlp.experts.12.up_proj", "model.layers.40.mlp.experts.13.up_proj", "model.layers.40.mlp.experts.14.up_proj", "model.layers.40.mlp.experts.15.up_proj", "model.layers.40.mlp.experts.16.up_proj", "model.layers.40.mlp.experts.17.up_proj", "model.layers.40.mlp.experts.18.up_proj", "model.layers.40.mlp.experts.19.up_proj", "model.layers.40.mlp.experts.20.up_proj", "model.layers.40.mlp.experts.21.up_proj", "model.layers.40.mlp.experts.22.up_proj", "model.layers.40.mlp.experts.23.up_proj", "model.layers.40.mlp.experts.24.up_proj", "model.layers.40.mlp.experts.25.up_proj", "model.layers.40.mlp.experts.26.up_proj", "model.layers.40.mlp.experts.27.up_proj", "model.layers.40.mlp.experts.28.up_proj", "model.layers.40.mlp.experts.29.up_proj", "model.layers.40.mlp.experts.30.up_proj", "model.layers.40.mlp.experts.31.up_proj", "model.layers.40.mlp.experts.32.up_proj", "model.layers.40.mlp.experts.33.up_proj", "model.layers.40.mlp.experts.34.up_proj", "model.layers.40.mlp.experts.35.up_proj", "model.layers.40.mlp.experts.36.up_proj", "model.layers.40.mlp.experts.37.up_proj", "model.layers.40.mlp.experts.38.up_proj", "model.layers.40.mlp.experts.39.up_proj", "model.layers.40.mlp.experts.40.up_proj", "model.layers.40.mlp.experts.41.up_proj", "model.layers.40.mlp.experts.42.up_proj", "model.layers.40.mlp.experts.43.up_proj", "model.layers.40.mlp.experts.44.up_proj", "model.layers.40.mlp.experts.45.up_proj", "model.layers.40.mlp.experts.46.up_proj", "model.layers.40.mlp.experts.47.up_proj", "model.layers.40.mlp.experts.48.up_proj", "model.layers.40.mlp.experts.49.up_proj", "model.layers.40.mlp.experts.50.up_proj", "model.layers.40.mlp.experts.51.up_proj", "model.layers.40.mlp.experts.52.up_proj", "model.layers.40.mlp.experts.53.up_proj", "model.layers.40.mlp.experts.54.up_proj", "model.layers.40.mlp.experts.55.up_proj", "model.layers.40.mlp.experts.56.up_proj", "model.layers.40.mlp.experts.57.up_proj", "model.layers.40.mlp.experts.58.up_proj", "model.layers.40.mlp.experts.59.up_proj", "model.layers.40.mlp.experts.60.up_proj", "model.layers.40.mlp.experts.61.up_proj", "model.layers.40.mlp.experts.62.up_proj", "model.layers.40.mlp.experts.63.up_proj", "model.layers.40.mlp.experts.64.up_proj", "model.layers.40.mlp.experts.65.up_proj", "model.layers.40.mlp.experts.66.up_proj", "model.layers.40.mlp.experts.67.up_proj", "model.layers.40.mlp.experts.68.up_proj", "model.layers.40.mlp.experts.69.up_proj", "model.layers.40.mlp.experts.70.up_proj", "model.layers.40.mlp.experts.71.up_proj", "model.layers.40.mlp.experts.72.up_proj", "model.layers.40.mlp.experts.73.up_proj", "model.layers.40.mlp.experts.74.up_proj", "model.layers.40.mlp.experts.75.up_proj", "model.layers.40.mlp.experts.76.up_proj", "model.layers.40.mlp.experts.77.up_proj", "model.layers.40.mlp.experts.78.up_proj", "model.layers.40.mlp.experts.79.up_proj", "model.layers.40.mlp.experts.80.up_proj", "model.layers.40.mlp.experts.81.up_proj", "model.layers.40.mlp.experts.82.up_proj", "model.layers.40.mlp.experts.83.up_proj", "model.layers.40.mlp.experts.84.up_proj", "model.layers.40.mlp.experts.85.up_proj", "model.layers.40.mlp.experts.86.up_proj", "model.layers.40.mlp.experts.87.up_proj", "model.layers.40.mlp.experts.88.up_proj", "model.layers.40.mlp.experts.89.up_proj", "model.layers.40.mlp.experts.90.up_proj", "model.layers.40.mlp.experts.91.up_proj", "model.layers.40.mlp.experts.92.up_proj", "model.layers.40.mlp.experts.93.up_proj", "model.layers.40.mlp.experts.94.up_proj", "model.layers.40.mlp.experts.95.up_proj", "model.layers.40.mlp.experts.96.up_proj", "model.layers.40.mlp.experts.97.up_proj", "model.layers.40.mlp.experts.98.up_proj", "model.layers.40.mlp.experts.99.up_proj", "model.layers.40.mlp.experts.100.up_proj", "model.layers.40.mlp.experts.101.up_proj", "model.layers.40.mlp.experts.102.up_proj", "model.layers.40.mlp.experts.103.up_proj", "model.layers.40.mlp.experts.104.up_proj", "model.layers.40.mlp.experts.105.up_proj", "model.layers.40.mlp.experts.106.up_proj", "model.layers.40.mlp.experts.107.up_proj", "model.layers.40.mlp.experts.108.up_proj", "model.layers.40.mlp.experts.109.up_proj", "model.layers.40.mlp.experts.110.up_proj", "model.layers.40.mlp.experts.111.up_proj", "model.layers.40.mlp.experts.112.up_proj", "model.layers.40.mlp.experts.113.up_proj", "model.layers.40.mlp.experts.114.up_proj", "model.layers.40.mlp.experts.115.up_proj", "model.layers.40.mlp.experts.116.up_proj", "model.layers.40.mlp.experts.117.up_proj", "model.layers.40.mlp.experts.118.up_proj", "model.layers.40.mlp.experts.119.up_proj", "model.layers.40.mlp.experts.120.up_proj", "model.layers.40.mlp.experts.121.up_proj", "model.layers.40.mlp.experts.122.up_proj", "model.layers.40.mlp.experts.123.up_proj", "model.layers.40.mlp.experts.124.up_proj", "model.layers.40.mlp.experts.125.up_proj", "model.layers.40.mlp.experts.126.up_proj", "model.layers.40.mlp.experts.127.up_proj", "model.layers.40.mlp.experts.128.up_proj", "model.layers.40.mlp.experts.129.up_proj", "model.layers.40.mlp.experts.130.up_proj", "model.layers.40.mlp.experts.131.up_proj", "model.layers.40.mlp.experts.132.up_proj", "model.layers.40.mlp.experts.133.up_proj", "model.layers.40.mlp.experts.134.up_proj", "model.layers.40.mlp.experts.135.up_proj", "model.layers.40.mlp.experts.136.up_proj", "model.layers.40.mlp.experts.137.up_proj", "model.layers.40.mlp.experts.138.up_proj", "model.layers.40.mlp.experts.139.up_proj", "model.layers.40.mlp.experts.140.up_proj", "model.layers.40.mlp.experts.141.up_proj", "model.layers.40.mlp.experts.142.up_proj", "model.layers.40.mlp.experts.143.up_proj", "model.layers.40.mlp.experts.144.up_proj", "model.layers.40.mlp.experts.145.up_proj", "model.layers.40.mlp.experts.146.up_proj", "model.layers.40.mlp.experts.147.up_proj", "model.layers.40.mlp.experts.148.up_proj", "model.layers.40.mlp.experts.149.up_proj", "model.layers.40.mlp.experts.150.up_proj", "model.layers.40.mlp.experts.151.up_proj", "model.layers.40.mlp.experts.152.up_proj", "model.layers.40.mlp.experts.153.up_proj", "model.layers.40.mlp.experts.154.up_proj", "model.layers.40.mlp.experts.155.up_proj", "model.layers.40.mlp.experts.156.up_proj", "model.layers.40.mlp.experts.157.up_proj", "model.layers.40.mlp.experts.158.up_proj", "model.layers.40.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.822237391024828e-05, "dbits": 2516582400 }, { "dkld": -2.739834599196911e-05, "dbits": 5033164800 } ] }, { "idx": 242, "layers": [ "model.layers.40.mlp.experts.0.down_proj", "model.layers.40.mlp.experts.1.down_proj", "model.layers.40.mlp.experts.2.down_proj", "model.layers.40.mlp.experts.3.down_proj", "model.layers.40.mlp.experts.4.down_proj", "model.layers.40.mlp.experts.5.down_proj", "model.layers.40.mlp.experts.6.down_proj", "model.layers.40.mlp.experts.7.down_proj", "model.layers.40.mlp.experts.8.down_proj", "model.layers.40.mlp.experts.9.down_proj", "model.layers.40.mlp.experts.10.down_proj", "model.layers.40.mlp.experts.11.down_proj", "model.layers.40.mlp.experts.12.down_proj", "model.layers.40.mlp.experts.13.down_proj", "model.layers.40.mlp.experts.14.down_proj", "model.layers.40.mlp.experts.15.down_proj", "model.layers.40.mlp.experts.16.down_proj", "model.layers.40.mlp.experts.17.down_proj", "model.layers.40.mlp.experts.18.down_proj", "model.layers.40.mlp.experts.19.down_proj", "model.layers.40.mlp.experts.20.down_proj", "model.layers.40.mlp.experts.21.down_proj", "model.layers.40.mlp.experts.22.down_proj", "model.layers.40.mlp.experts.23.down_proj", "model.layers.40.mlp.experts.24.down_proj", "model.layers.40.mlp.experts.25.down_proj", "model.layers.40.mlp.experts.26.down_proj", "model.layers.40.mlp.experts.27.down_proj", "model.layers.40.mlp.experts.28.down_proj", "model.layers.40.mlp.experts.29.down_proj", "model.layers.40.mlp.experts.30.down_proj", "model.layers.40.mlp.experts.31.down_proj", "model.layers.40.mlp.experts.32.down_proj", "model.layers.40.mlp.experts.33.down_proj", "model.layers.40.mlp.experts.34.down_proj", "model.layers.40.mlp.experts.35.down_proj", "model.layers.40.mlp.experts.36.down_proj", "model.layers.40.mlp.experts.37.down_proj", "model.layers.40.mlp.experts.38.down_proj", "model.layers.40.mlp.experts.39.down_proj", "model.layers.40.mlp.experts.40.down_proj", "model.layers.40.mlp.experts.41.down_proj", "model.layers.40.mlp.experts.42.down_proj", "model.layers.40.mlp.experts.43.down_proj", "model.layers.40.mlp.experts.44.down_proj", "model.layers.40.mlp.experts.45.down_proj", "model.layers.40.mlp.experts.46.down_proj", "model.layers.40.mlp.experts.47.down_proj", "model.layers.40.mlp.experts.48.down_proj", "model.layers.40.mlp.experts.49.down_proj", "model.layers.40.mlp.experts.50.down_proj", "model.layers.40.mlp.experts.51.down_proj", "model.layers.40.mlp.experts.52.down_proj", "model.layers.40.mlp.experts.53.down_proj", "model.layers.40.mlp.experts.54.down_proj", "model.layers.40.mlp.experts.55.down_proj", "model.layers.40.mlp.experts.56.down_proj", "model.layers.40.mlp.experts.57.down_proj", "model.layers.40.mlp.experts.58.down_proj", "model.layers.40.mlp.experts.59.down_proj", "model.layers.40.mlp.experts.60.down_proj", "model.layers.40.mlp.experts.61.down_proj", "model.layers.40.mlp.experts.62.down_proj", "model.layers.40.mlp.experts.63.down_proj", "model.layers.40.mlp.experts.64.down_proj", "model.layers.40.mlp.experts.65.down_proj", "model.layers.40.mlp.experts.66.down_proj", "model.layers.40.mlp.experts.67.down_proj", "model.layers.40.mlp.experts.68.down_proj", "model.layers.40.mlp.experts.69.down_proj", "model.layers.40.mlp.experts.70.down_proj", "model.layers.40.mlp.experts.71.down_proj", "model.layers.40.mlp.experts.72.down_proj", "model.layers.40.mlp.experts.73.down_proj", "model.layers.40.mlp.experts.74.down_proj", "model.layers.40.mlp.experts.75.down_proj", "model.layers.40.mlp.experts.76.down_proj", "model.layers.40.mlp.experts.77.down_proj", "model.layers.40.mlp.experts.78.down_proj", "model.layers.40.mlp.experts.79.down_proj", "model.layers.40.mlp.experts.80.down_proj", "model.layers.40.mlp.experts.81.down_proj", "model.layers.40.mlp.experts.82.down_proj", "model.layers.40.mlp.experts.83.down_proj", "model.layers.40.mlp.experts.84.down_proj", "model.layers.40.mlp.experts.85.down_proj", "model.layers.40.mlp.experts.86.down_proj", "model.layers.40.mlp.experts.87.down_proj", "model.layers.40.mlp.experts.88.down_proj", "model.layers.40.mlp.experts.89.down_proj", "model.layers.40.mlp.experts.90.down_proj", "model.layers.40.mlp.experts.91.down_proj", "model.layers.40.mlp.experts.92.down_proj", "model.layers.40.mlp.experts.93.down_proj", "model.layers.40.mlp.experts.94.down_proj", "model.layers.40.mlp.experts.95.down_proj", "model.layers.40.mlp.experts.96.down_proj", "model.layers.40.mlp.experts.97.down_proj", "model.layers.40.mlp.experts.98.down_proj", "model.layers.40.mlp.experts.99.down_proj", "model.layers.40.mlp.experts.100.down_proj", "model.layers.40.mlp.experts.101.down_proj", "model.layers.40.mlp.experts.102.down_proj", "model.layers.40.mlp.experts.103.down_proj", "model.layers.40.mlp.experts.104.down_proj", "model.layers.40.mlp.experts.105.down_proj", "model.layers.40.mlp.experts.106.down_proj", "model.layers.40.mlp.experts.107.down_proj", "model.layers.40.mlp.experts.108.down_proj", "model.layers.40.mlp.experts.109.down_proj", "model.layers.40.mlp.experts.110.down_proj", "model.layers.40.mlp.experts.111.down_proj", "model.layers.40.mlp.experts.112.down_proj", "model.layers.40.mlp.experts.113.down_proj", "model.layers.40.mlp.experts.114.down_proj", "model.layers.40.mlp.experts.115.down_proj", "model.layers.40.mlp.experts.116.down_proj", "model.layers.40.mlp.experts.117.down_proj", "model.layers.40.mlp.experts.118.down_proj", "model.layers.40.mlp.experts.119.down_proj", "model.layers.40.mlp.experts.120.down_proj", "model.layers.40.mlp.experts.121.down_proj", "model.layers.40.mlp.experts.122.down_proj", "model.layers.40.mlp.experts.123.down_proj", "model.layers.40.mlp.experts.124.down_proj", "model.layers.40.mlp.experts.125.down_proj", "model.layers.40.mlp.experts.126.down_proj", "model.layers.40.mlp.experts.127.down_proj", "model.layers.40.mlp.experts.128.down_proj", "model.layers.40.mlp.experts.129.down_proj", "model.layers.40.mlp.experts.130.down_proj", "model.layers.40.mlp.experts.131.down_proj", "model.layers.40.mlp.experts.132.down_proj", "model.layers.40.mlp.experts.133.down_proj", "model.layers.40.mlp.experts.134.down_proj", "model.layers.40.mlp.experts.135.down_proj", "model.layers.40.mlp.experts.136.down_proj", "model.layers.40.mlp.experts.137.down_proj", "model.layers.40.mlp.experts.138.down_proj", "model.layers.40.mlp.experts.139.down_proj", "model.layers.40.mlp.experts.140.down_proj", "model.layers.40.mlp.experts.141.down_proj", "model.layers.40.mlp.experts.142.down_proj", "model.layers.40.mlp.experts.143.down_proj", "model.layers.40.mlp.experts.144.down_proj", "model.layers.40.mlp.experts.145.down_proj", "model.layers.40.mlp.experts.146.down_proj", "model.layers.40.mlp.experts.147.down_proj", "model.layers.40.mlp.experts.148.down_proj", "model.layers.40.mlp.experts.149.down_proj", "model.layers.40.mlp.experts.150.down_proj", "model.layers.40.mlp.experts.151.down_proj", "model.layers.40.mlp.experts.152.down_proj", "model.layers.40.mlp.experts.153.down_proj", "model.layers.40.mlp.experts.154.down_proj", "model.layers.40.mlp.experts.155.down_proj", "model.layers.40.mlp.experts.156.down_proj", "model.layers.40.mlp.experts.157.down_proj", "model.layers.40.mlp.experts.158.down_proj", "model.layers.40.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -7.320956792682305e-05, "dbits": 1258291200 }, { "dkld": -5.212458781897987e-05, "dbits": 2516582400 } ] }, { "idx": 243, "layers": [ "model.layers.41.self_attn.q_proj" ], "candidates": [ { "dkld": -1.188698224723235e-05, "dbits": 62914560 }, { "dkld": 1.3996171765029777e-05, "dbits": 125829120 } ] }, { "idx": 244, "layers": [ "model.layers.41.self_attn.k_proj", "model.layers.41.self_attn.v_proj" ], "candidates": [ { "dkld": -8.400483056902885e-05, "dbits": 10485760 }, { "dkld": -0.00010842937044799189, "dbits": 20971520 } ] }, { "idx": 245, "layers": [ "model.layers.41.self_attn.o_proj" ], "candidates": [ { "dkld": -1.5295110642910004e-05, "dbits": 62914560 }, { "dkld": -3.6019529215990456e-05, "dbits": 125829120 } ] }, { "idx": 246, "layers": [ "model.layers.41.mlp.shared_experts.gate_proj", "model.layers.41.mlp.shared_experts.up_proj", "model.layers.41.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 8.584808092564414e-05, "dbits": 23592960 }, { "dkld": 3.479444421827793e-05, "dbits": 47185920 } ] }, { "idx": 247, "layers": [ "model.layers.41.mlp.experts.0.gate_proj", "model.layers.41.mlp.experts.1.gate_proj", "model.layers.41.mlp.experts.2.gate_proj", "model.layers.41.mlp.experts.3.gate_proj", "model.layers.41.mlp.experts.4.gate_proj", "model.layers.41.mlp.experts.5.gate_proj", "model.layers.41.mlp.experts.6.gate_proj", "model.layers.41.mlp.experts.7.gate_proj", "model.layers.41.mlp.experts.8.gate_proj", "model.layers.41.mlp.experts.9.gate_proj", "model.layers.41.mlp.experts.10.gate_proj", "model.layers.41.mlp.experts.11.gate_proj", "model.layers.41.mlp.experts.12.gate_proj", "model.layers.41.mlp.experts.13.gate_proj", "model.layers.41.mlp.experts.14.gate_proj", "model.layers.41.mlp.experts.15.gate_proj", "model.layers.41.mlp.experts.16.gate_proj", "model.layers.41.mlp.experts.17.gate_proj", "model.layers.41.mlp.experts.18.gate_proj", "model.layers.41.mlp.experts.19.gate_proj", "model.layers.41.mlp.experts.20.gate_proj", "model.layers.41.mlp.experts.21.gate_proj", "model.layers.41.mlp.experts.22.gate_proj", "model.layers.41.mlp.experts.23.gate_proj", "model.layers.41.mlp.experts.24.gate_proj", "model.layers.41.mlp.experts.25.gate_proj", "model.layers.41.mlp.experts.26.gate_proj", "model.layers.41.mlp.experts.27.gate_proj", "model.layers.41.mlp.experts.28.gate_proj", "model.layers.41.mlp.experts.29.gate_proj", "model.layers.41.mlp.experts.30.gate_proj", "model.layers.41.mlp.experts.31.gate_proj", "model.layers.41.mlp.experts.32.gate_proj", "model.layers.41.mlp.experts.33.gate_proj", "model.layers.41.mlp.experts.34.gate_proj", "model.layers.41.mlp.experts.35.gate_proj", "model.layers.41.mlp.experts.36.gate_proj", "model.layers.41.mlp.experts.37.gate_proj", "model.layers.41.mlp.experts.38.gate_proj", "model.layers.41.mlp.experts.39.gate_proj", "model.layers.41.mlp.experts.40.gate_proj", "model.layers.41.mlp.experts.41.gate_proj", "model.layers.41.mlp.experts.42.gate_proj", "model.layers.41.mlp.experts.43.gate_proj", "model.layers.41.mlp.experts.44.gate_proj", "model.layers.41.mlp.experts.45.gate_proj", "model.layers.41.mlp.experts.46.gate_proj", "model.layers.41.mlp.experts.47.gate_proj", "model.layers.41.mlp.experts.48.gate_proj", "model.layers.41.mlp.experts.49.gate_proj", "model.layers.41.mlp.experts.50.gate_proj", "model.layers.41.mlp.experts.51.gate_proj", "model.layers.41.mlp.experts.52.gate_proj", "model.layers.41.mlp.experts.53.gate_proj", "model.layers.41.mlp.experts.54.gate_proj", "model.layers.41.mlp.experts.55.gate_proj", "model.layers.41.mlp.experts.56.gate_proj", "model.layers.41.mlp.experts.57.gate_proj", "model.layers.41.mlp.experts.58.gate_proj", "model.layers.41.mlp.experts.59.gate_proj", "model.layers.41.mlp.experts.60.gate_proj", "model.layers.41.mlp.experts.61.gate_proj", "model.layers.41.mlp.experts.62.gate_proj", "model.layers.41.mlp.experts.63.gate_proj", "model.layers.41.mlp.experts.64.gate_proj", "model.layers.41.mlp.experts.65.gate_proj", "model.layers.41.mlp.experts.66.gate_proj", "model.layers.41.mlp.experts.67.gate_proj", "model.layers.41.mlp.experts.68.gate_proj", "model.layers.41.mlp.experts.69.gate_proj", "model.layers.41.mlp.experts.70.gate_proj", "model.layers.41.mlp.experts.71.gate_proj", "model.layers.41.mlp.experts.72.gate_proj", "model.layers.41.mlp.experts.73.gate_proj", "model.layers.41.mlp.experts.74.gate_proj", "model.layers.41.mlp.experts.75.gate_proj", "model.layers.41.mlp.experts.76.gate_proj", "model.layers.41.mlp.experts.77.gate_proj", "model.layers.41.mlp.experts.78.gate_proj", "model.layers.41.mlp.experts.79.gate_proj", "model.layers.41.mlp.experts.80.gate_proj", "model.layers.41.mlp.experts.81.gate_proj", "model.layers.41.mlp.experts.82.gate_proj", "model.layers.41.mlp.experts.83.gate_proj", "model.layers.41.mlp.experts.84.gate_proj", "model.layers.41.mlp.experts.85.gate_proj", "model.layers.41.mlp.experts.86.gate_proj", "model.layers.41.mlp.experts.87.gate_proj", "model.layers.41.mlp.experts.88.gate_proj", "model.layers.41.mlp.experts.89.gate_proj", "model.layers.41.mlp.experts.90.gate_proj", "model.layers.41.mlp.experts.91.gate_proj", "model.layers.41.mlp.experts.92.gate_proj", "model.layers.41.mlp.experts.93.gate_proj", "model.layers.41.mlp.experts.94.gate_proj", "model.layers.41.mlp.experts.95.gate_proj", "model.layers.41.mlp.experts.96.gate_proj", "model.layers.41.mlp.experts.97.gate_proj", "model.layers.41.mlp.experts.98.gate_proj", "model.layers.41.mlp.experts.99.gate_proj", "model.layers.41.mlp.experts.100.gate_proj", "model.layers.41.mlp.experts.101.gate_proj", "model.layers.41.mlp.experts.102.gate_proj", "model.layers.41.mlp.experts.103.gate_proj", "model.layers.41.mlp.experts.104.gate_proj", "model.layers.41.mlp.experts.105.gate_proj", "model.layers.41.mlp.experts.106.gate_proj", "model.layers.41.mlp.experts.107.gate_proj", "model.layers.41.mlp.experts.108.gate_proj", "model.layers.41.mlp.experts.109.gate_proj", "model.layers.41.mlp.experts.110.gate_proj", "model.layers.41.mlp.experts.111.gate_proj", "model.layers.41.mlp.experts.112.gate_proj", "model.layers.41.mlp.experts.113.gate_proj", "model.layers.41.mlp.experts.114.gate_proj", "model.layers.41.mlp.experts.115.gate_proj", "model.layers.41.mlp.experts.116.gate_proj", "model.layers.41.mlp.experts.117.gate_proj", "model.layers.41.mlp.experts.118.gate_proj", "model.layers.41.mlp.experts.119.gate_proj", "model.layers.41.mlp.experts.120.gate_proj", "model.layers.41.mlp.experts.121.gate_proj", "model.layers.41.mlp.experts.122.gate_proj", "model.layers.41.mlp.experts.123.gate_proj", "model.layers.41.mlp.experts.124.gate_proj", "model.layers.41.mlp.experts.125.gate_proj", "model.layers.41.mlp.experts.126.gate_proj", "model.layers.41.mlp.experts.127.gate_proj", "model.layers.41.mlp.experts.128.gate_proj", "model.layers.41.mlp.experts.129.gate_proj", "model.layers.41.mlp.experts.130.gate_proj", "model.layers.41.mlp.experts.131.gate_proj", "model.layers.41.mlp.experts.132.gate_proj", "model.layers.41.mlp.experts.133.gate_proj", "model.layers.41.mlp.experts.134.gate_proj", "model.layers.41.mlp.experts.135.gate_proj", "model.layers.41.mlp.experts.136.gate_proj", "model.layers.41.mlp.experts.137.gate_proj", "model.layers.41.mlp.experts.138.gate_proj", "model.layers.41.mlp.experts.139.gate_proj", "model.layers.41.mlp.experts.140.gate_proj", "model.layers.41.mlp.experts.141.gate_proj", "model.layers.41.mlp.experts.142.gate_proj", "model.layers.41.mlp.experts.143.gate_proj", "model.layers.41.mlp.experts.144.gate_proj", "model.layers.41.mlp.experts.145.gate_proj", "model.layers.41.mlp.experts.146.gate_proj", "model.layers.41.mlp.experts.147.gate_proj", "model.layers.41.mlp.experts.148.gate_proj", "model.layers.41.mlp.experts.149.gate_proj", "model.layers.41.mlp.experts.150.gate_proj", "model.layers.41.mlp.experts.151.gate_proj", "model.layers.41.mlp.experts.152.gate_proj", "model.layers.41.mlp.experts.153.gate_proj", "model.layers.41.mlp.experts.154.gate_proj", "model.layers.41.mlp.experts.155.gate_proj", "model.layers.41.mlp.experts.156.gate_proj", "model.layers.41.mlp.experts.157.gate_proj", "model.layers.41.mlp.experts.158.gate_proj", "model.layers.41.mlp.experts.159.gate_proj", "model.layers.41.mlp.experts.0.up_proj", "model.layers.41.mlp.experts.1.up_proj", "model.layers.41.mlp.experts.2.up_proj", "model.layers.41.mlp.experts.3.up_proj", "model.layers.41.mlp.experts.4.up_proj", "model.layers.41.mlp.experts.5.up_proj", "model.layers.41.mlp.experts.6.up_proj", "model.layers.41.mlp.experts.7.up_proj", "model.layers.41.mlp.experts.8.up_proj", "model.layers.41.mlp.experts.9.up_proj", "model.layers.41.mlp.experts.10.up_proj", "model.layers.41.mlp.experts.11.up_proj", "model.layers.41.mlp.experts.12.up_proj", "model.layers.41.mlp.experts.13.up_proj", "model.layers.41.mlp.experts.14.up_proj", "model.layers.41.mlp.experts.15.up_proj", "model.layers.41.mlp.experts.16.up_proj", "model.layers.41.mlp.experts.17.up_proj", "model.layers.41.mlp.experts.18.up_proj", "model.layers.41.mlp.experts.19.up_proj", "model.layers.41.mlp.experts.20.up_proj", "model.layers.41.mlp.experts.21.up_proj", "model.layers.41.mlp.experts.22.up_proj", "model.layers.41.mlp.experts.23.up_proj", "model.layers.41.mlp.experts.24.up_proj", "model.layers.41.mlp.experts.25.up_proj", "model.layers.41.mlp.experts.26.up_proj", "model.layers.41.mlp.experts.27.up_proj", "model.layers.41.mlp.experts.28.up_proj", "model.layers.41.mlp.experts.29.up_proj", "model.layers.41.mlp.experts.30.up_proj", "model.layers.41.mlp.experts.31.up_proj", "model.layers.41.mlp.experts.32.up_proj", "model.layers.41.mlp.experts.33.up_proj", "model.layers.41.mlp.experts.34.up_proj", "model.layers.41.mlp.experts.35.up_proj", "model.layers.41.mlp.experts.36.up_proj", "model.layers.41.mlp.experts.37.up_proj", "model.layers.41.mlp.experts.38.up_proj", "model.layers.41.mlp.experts.39.up_proj", "model.layers.41.mlp.experts.40.up_proj", "model.layers.41.mlp.experts.41.up_proj", "model.layers.41.mlp.experts.42.up_proj", "model.layers.41.mlp.experts.43.up_proj", "model.layers.41.mlp.experts.44.up_proj", "model.layers.41.mlp.experts.45.up_proj", "model.layers.41.mlp.experts.46.up_proj", "model.layers.41.mlp.experts.47.up_proj", "model.layers.41.mlp.experts.48.up_proj", "model.layers.41.mlp.experts.49.up_proj", "model.layers.41.mlp.experts.50.up_proj", "model.layers.41.mlp.experts.51.up_proj", "model.layers.41.mlp.experts.52.up_proj", "model.layers.41.mlp.experts.53.up_proj", "model.layers.41.mlp.experts.54.up_proj", "model.layers.41.mlp.experts.55.up_proj", "model.layers.41.mlp.experts.56.up_proj", "model.layers.41.mlp.experts.57.up_proj", "model.layers.41.mlp.experts.58.up_proj", "model.layers.41.mlp.experts.59.up_proj", "model.layers.41.mlp.experts.60.up_proj", "model.layers.41.mlp.experts.61.up_proj", "model.layers.41.mlp.experts.62.up_proj", "model.layers.41.mlp.experts.63.up_proj", "model.layers.41.mlp.experts.64.up_proj", "model.layers.41.mlp.experts.65.up_proj", "model.layers.41.mlp.experts.66.up_proj", "model.layers.41.mlp.experts.67.up_proj", "model.layers.41.mlp.experts.68.up_proj", "model.layers.41.mlp.experts.69.up_proj", "model.layers.41.mlp.experts.70.up_proj", "model.layers.41.mlp.experts.71.up_proj", "model.layers.41.mlp.experts.72.up_proj", "model.layers.41.mlp.experts.73.up_proj", "model.layers.41.mlp.experts.74.up_proj", "model.layers.41.mlp.experts.75.up_proj", "model.layers.41.mlp.experts.76.up_proj", "model.layers.41.mlp.experts.77.up_proj", "model.layers.41.mlp.experts.78.up_proj", "model.layers.41.mlp.experts.79.up_proj", "model.layers.41.mlp.experts.80.up_proj", "model.layers.41.mlp.experts.81.up_proj", "model.layers.41.mlp.experts.82.up_proj", "model.layers.41.mlp.experts.83.up_proj", "model.layers.41.mlp.experts.84.up_proj", "model.layers.41.mlp.experts.85.up_proj", "model.layers.41.mlp.experts.86.up_proj", "model.layers.41.mlp.experts.87.up_proj", "model.layers.41.mlp.experts.88.up_proj", "model.layers.41.mlp.experts.89.up_proj", "model.layers.41.mlp.experts.90.up_proj", "model.layers.41.mlp.experts.91.up_proj", "model.layers.41.mlp.experts.92.up_proj", "model.layers.41.mlp.experts.93.up_proj", "model.layers.41.mlp.experts.94.up_proj", "model.layers.41.mlp.experts.95.up_proj", "model.layers.41.mlp.experts.96.up_proj", "model.layers.41.mlp.experts.97.up_proj", "model.layers.41.mlp.experts.98.up_proj", "model.layers.41.mlp.experts.99.up_proj", "model.layers.41.mlp.experts.100.up_proj", "model.layers.41.mlp.experts.101.up_proj", "model.layers.41.mlp.experts.102.up_proj", "model.layers.41.mlp.experts.103.up_proj", "model.layers.41.mlp.experts.104.up_proj", "model.layers.41.mlp.experts.105.up_proj", "model.layers.41.mlp.experts.106.up_proj", "model.layers.41.mlp.experts.107.up_proj", "model.layers.41.mlp.experts.108.up_proj", "model.layers.41.mlp.experts.109.up_proj", "model.layers.41.mlp.experts.110.up_proj", "model.layers.41.mlp.experts.111.up_proj", "model.layers.41.mlp.experts.112.up_proj", "model.layers.41.mlp.experts.113.up_proj", "model.layers.41.mlp.experts.114.up_proj", "model.layers.41.mlp.experts.115.up_proj", "model.layers.41.mlp.experts.116.up_proj", "model.layers.41.mlp.experts.117.up_proj", "model.layers.41.mlp.experts.118.up_proj", "model.layers.41.mlp.experts.119.up_proj", "model.layers.41.mlp.experts.120.up_proj", "model.layers.41.mlp.experts.121.up_proj", "model.layers.41.mlp.experts.122.up_proj", "model.layers.41.mlp.experts.123.up_proj", "model.layers.41.mlp.experts.124.up_proj", "model.layers.41.mlp.experts.125.up_proj", "model.layers.41.mlp.experts.126.up_proj", "model.layers.41.mlp.experts.127.up_proj", "model.layers.41.mlp.experts.128.up_proj", "model.layers.41.mlp.experts.129.up_proj", "model.layers.41.mlp.experts.130.up_proj", "model.layers.41.mlp.experts.131.up_proj", "model.layers.41.mlp.experts.132.up_proj", "model.layers.41.mlp.experts.133.up_proj", "model.layers.41.mlp.experts.134.up_proj", "model.layers.41.mlp.experts.135.up_proj", "model.layers.41.mlp.experts.136.up_proj", "model.layers.41.mlp.experts.137.up_proj", "model.layers.41.mlp.experts.138.up_proj", "model.layers.41.mlp.experts.139.up_proj", "model.layers.41.mlp.experts.140.up_proj", "model.layers.41.mlp.experts.141.up_proj", "model.layers.41.mlp.experts.142.up_proj", "model.layers.41.mlp.experts.143.up_proj", "model.layers.41.mlp.experts.144.up_proj", "model.layers.41.mlp.experts.145.up_proj", "model.layers.41.mlp.experts.146.up_proj", "model.layers.41.mlp.experts.147.up_proj", "model.layers.41.mlp.experts.148.up_proj", "model.layers.41.mlp.experts.149.up_proj", "model.layers.41.mlp.experts.150.up_proj", "model.layers.41.mlp.experts.151.up_proj", "model.layers.41.mlp.experts.152.up_proj", "model.layers.41.mlp.experts.153.up_proj", "model.layers.41.mlp.experts.154.up_proj", "model.layers.41.mlp.experts.155.up_proj", "model.layers.41.mlp.experts.156.up_proj", "model.layers.41.mlp.experts.157.up_proj", "model.layers.41.mlp.experts.158.up_proj", "model.layers.41.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.1355721876024506e-05, "dbits": 2516582400 }, { "dkld": -3.7460797466337334e-05, "dbits": 5033164800 } ] }, { "idx": 248, "layers": [ "model.layers.41.mlp.experts.0.down_proj", "model.layers.41.mlp.experts.1.down_proj", "model.layers.41.mlp.experts.2.down_proj", "model.layers.41.mlp.experts.3.down_proj", "model.layers.41.mlp.experts.4.down_proj", "model.layers.41.mlp.experts.5.down_proj", "model.layers.41.mlp.experts.6.down_proj", "model.layers.41.mlp.experts.7.down_proj", "model.layers.41.mlp.experts.8.down_proj", "model.layers.41.mlp.experts.9.down_proj", "model.layers.41.mlp.experts.10.down_proj", "model.layers.41.mlp.experts.11.down_proj", "model.layers.41.mlp.experts.12.down_proj", "model.layers.41.mlp.experts.13.down_proj", "model.layers.41.mlp.experts.14.down_proj", "model.layers.41.mlp.experts.15.down_proj", "model.layers.41.mlp.experts.16.down_proj", "model.layers.41.mlp.experts.17.down_proj", "model.layers.41.mlp.experts.18.down_proj", "model.layers.41.mlp.experts.19.down_proj", "model.layers.41.mlp.experts.20.down_proj", "model.layers.41.mlp.experts.21.down_proj", "model.layers.41.mlp.experts.22.down_proj", "model.layers.41.mlp.experts.23.down_proj", "model.layers.41.mlp.experts.24.down_proj", "model.layers.41.mlp.experts.25.down_proj", "model.layers.41.mlp.experts.26.down_proj", "model.layers.41.mlp.experts.27.down_proj", "model.layers.41.mlp.experts.28.down_proj", "model.layers.41.mlp.experts.29.down_proj", "model.layers.41.mlp.experts.30.down_proj", "model.layers.41.mlp.experts.31.down_proj", "model.layers.41.mlp.experts.32.down_proj", "model.layers.41.mlp.experts.33.down_proj", "model.layers.41.mlp.experts.34.down_proj", "model.layers.41.mlp.experts.35.down_proj", "model.layers.41.mlp.experts.36.down_proj", "model.layers.41.mlp.experts.37.down_proj", "model.layers.41.mlp.experts.38.down_proj", "model.layers.41.mlp.experts.39.down_proj", "model.layers.41.mlp.experts.40.down_proj", "model.layers.41.mlp.experts.41.down_proj", "model.layers.41.mlp.experts.42.down_proj", "model.layers.41.mlp.experts.43.down_proj", "model.layers.41.mlp.experts.44.down_proj", "model.layers.41.mlp.experts.45.down_proj", "model.layers.41.mlp.experts.46.down_proj", "model.layers.41.mlp.experts.47.down_proj", "model.layers.41.mlp.experts.48.down_proj", "model.layers.41.mlp.experts.49.down_proj", "model.layers.41.mlp.experts.50.down_proj", "model.layers.41.mlp.experts.51.down_proj", "model.layers.41.mlp.experts.52.down_proj", "model.layers.41.mlp.experts.53.down_proj", "model.layers.41.mlp.experts.54.down_proj", "model.layers.41.mlp.experts.55.down_proj", "model.layers.41.mlp.experts.56.down_proj", "model.layers.41.mlp.experts.57.down_proj", "model.layers.41.mlp.experts.58.down_proj", "model.layers.41.mlp.experts.59.down_proj", "model.layers.41.mlp.experts.60.down_proj", "model.layers.41.mlp.experts.61.down_proj", "model.layers.41.mlp.experts.62.down_proj", "model.layers.41.mlp.experts.63.down_proj", "model.layers.41.mlp.experts.64.down_proj", "model.layers.41.mlp.experts.65.down_proj", "model.layers.41.mlp.experts.66.down_proj", "model.layers.41.mlp.experts.67.down_proj", "model.layers.41.mlp.experts.68.down_proj", "model.layers.41.mlp.experts.69.down_proj", "model.layers.41.mlp.experts.70.down_proj", "model.layers.41.mlp.experts.71.down_proj", "model.layers.41.mlp.experts.72.down_proj", "model.layers.41.mlp.experts.73.down_proj", "model.layers.41.mlp.experts.74.down_proj", "model.layers.41.mlp.experts.75.down_proj", "model.layers.41.mlp.experts.76.down_proj", "model.layers.41.mlp.experts.77.down_proj", "model.layers.41.mlp.experts.78.down_proj", "model.layers.41.mlp.experts.79.down_proj", "model.layers.41.mlp.experts.80.down_proj", "model.layers.41.mlp.experts.81.down_proj", "model.layers.41.mlp.experts.82.down_proj", "model.layers.41.mlp.experts.83.down_proj", "model.layers.41.mlp.experts.84.down_proj", "model.layers.41.mlp.experts.85.down_proj", "model.layers.41.mlp.experts.86.down_proj", "model.layers.41.mlp.experts.87.down_proj", "model.layers.41.mlp.experts.88.down_proj", "model.layers.41.mlp.experts.89.down_proj", "model.layers.41.mlp.experts.90.down_proj", "model.layers.41.mlp.experts.91.down_proj", "model.layers.41.mlp.experts.92.down_proj", "model.layers.41.mlp.experts.93.down_proj", "model.layers.41.mlp.experts.94.down_proj", "model.layers.41.mlp.experts.95.down_proj", "model.layers.41.mlp.experts.96.down_proj", "model.layers.41.mlp.experts.97.down_proj", "model.layers.41.mlp.experts.98.down_proj", "model.layers.41.mlp.experts.99.down_proj", "model.layers.41.mlp.experts.100.down_proj", "model.layers.41.mlp.experts.101.down_proj", "model.layers.41.mlp.experts.102.down_proj", "model.layers.41.mlp.experts.103.down_proj", "model.layers.41.mlp.experts.104.down_proj", "model.layers.41.mlp.experts.105.down_proj", "model.layers.41.mlp.experts.106.down_proj", "model.layers.41.mlp.experts.107.down_proj", "model.layers.41.mlp.experts.108.down_proj", "model.layers.41.mlp.experts.109.down_proj", "model.layers.41.mlp.experts.110.down_proj", "model.layers.41.mlp.experts.111.down_proj", "model.layers.41.mlp.experts.112.down_proj", "model.layers.41.mlp.experts.113.down_proj", "model.layers.41.mlp.experts.114.down_proj", "model.layers.41.mlp.experts.115.down_proj", "model.layers.41.mlp.experts.116.down_proj", "model.layers.41.mlp.experts.117.down_proj", "model.layers.41.mlp.experts.118.down_proj", "model.layers.41.mlp.experts.119.down_proj", "model.layers.41.mlp.experts.120.down_proj", "model.layers.41.mlp.experts.121.down_proj", "model.layers.41.mlp.experts.122.down_proj", "model.layers.41.mlp.experts.123.down_proj", "model.layers.41.mlp.experts.124.down_proj", "model.layers.41.mlp.experts.125.down_proj", "model.layers.41.mlp.experts.126.down_proj", "model.layers.41.mlp.experts.127.down_proj", "model.layers.41.mlp.experts.128.down_proj", "model.layers.41.mlp.experts.129.down_proj", "model.layers.41.mlp.experts.130.down_proj", "model.layers.41.mlp.experts.131.down_proj", "model.layers.41.mlp.experts.132.down_proj", "model.layers.41.mlp.experts.133.down_proj", "model.layers.41.mlp.experts.134.down_proj", "model.layers.41.mlp.experts.135.down_proj", "model.layers.41.mlp.experts.136.down_proj", "model.layers.41.mlp.experts.137.down_proj", "model.layers.41.mlp.experts.138.down_proj", "model.layers.41.mlp.experts.139.down_proj", "model.layers.41.mlp.experts.140.down_proj", "model.layers.41.mlp.experts.141.down_proj", "model.layers.41.mlp.experts.142.down_proj", "model.layers.41.mlp.experts.143.down_proj", "model.layers.41.mlp.experts.144.down_proj", "model.layers.41.mlp.experts.145.down_proj", "model.layers.41.mlp.experts.146.down_proj", "model.layers.41.mlp.experts.147.down_proj", "model.layers.41.mlp.experts.148.down_proj", "model.layers.41.mlp.experts.149.down_proj", "model.layers.41.mlp.experts.150.down_proj", "model.layers.41.mlp.experts.151.down_proj", "model.layers.41.mlp.experts.152.down_proj", "model.layers.41.mlp.experts.153.down_proj", "model.layers.41.mlp.experts.154.down_proj", "model.layers.41.mlp.experts.155.down_proj", "model.layers.41.mlp.experts.156.down_proj", "model.layers.41.mlp.experts.157.down_proj", "model.layers.41.mlp.experts.158.down_proj", "model.layers.41.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 1.2405193410815196e-05, "dbits": 1258291200 }, { "dkld": 4.8285070806742755e-05, "dbits": 2516582400 } ] }, { "idx": 249, "layers": [ "model.layers.42.self_attn.q_proj" ], "candidates": [ { "dkld": -4.787300713359616e-06, "dbits": 62914560 }, { "dkld": -1.4796783216296586e-05, "dbits": 125829120 } ] }, { "idx": 250, "layers": [ "model.layers.42.self_attn.k_proj", "model.layers.42.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0002482081297785037, "dbits": 10485760 }, { "dkld": -0.00026132347993552615, "dbits": 20971520 } ] }, { "idx": 251, "layers": [ "model.layers.42.self_attn.o_proj" ], "candidates": [ { "dkld": 5.0069764256477356e-05, "dbits": 62914560 }, { "dkld": 8.10295809060349e-05, "dbits": 125829120 } ] }, { "idx": 252, "layers": [ "model.layers.42.mlp.shared_experts.gate_proj", "model.layers.42.mlp.shared_experts.up_proj", "model.layers.42.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.333807595074038e-05, "dbits": 23592960 }, { "dkld": 1.5347427688539722e-05, "dbits": 47185920 } ] }, { "idx": 253, "layers": [ "model.layers.42.mlp.experts.0.gate_proj", "model.layers.42.mlp.experts.1.gate_proj", "model.layers.42.mlp.experts.2.gate_proj", "model.layers.42.mlp.experts.3.gate_proj", "model.layers.42.mlp.experts.4.gate_proj", "model.layers.42.mlp.experts.5.gate_proj", "model.layers.42.mlp.experts.6.gate_proj", "model.layers.42.mlp.experts.7.gate_proj", "model.layers.42.mlp.experts.8.gate_proj", "model.layers.42.mlp.experts.9.gate_proj", "model.layers.42.mlp.experts.10.gate_proj", "model.layers.42.mlp.experts.11.gate_proj", "model.layers.42.mlp.experts.12.gate_proj", "model.layers.42.mlp.experts.13.gate_proj", "model.layers.42.mlp.experts.14.gate_proj", "model.layers.42.mlp.experts.15.gate_proj", "model.layers.42.mlp.experts.16.gate_proj", "model.layers.42.mlp.experts.17.gate_proj", "model.layers.42.mlp.experts.18.gate_proj", "model.layers.42.mlp.experts.19.gate_proj", "model.layers.42.mlp.experts.20.gate_proj", "model.layers.42.mlp.experts.21.gate_proj", "model.layers.42.mlp.experts.22.gate_proj", "model.layers.42.mlp.experts.23.gate_proj", "model.layers.42.mlp.experts.24.gate_proj", "model.layers.42.mlp.experts.25.gate_proj", "model.layers.42.mlp.experts.26.gate_proj", "model.layers.42.mlp.experts.27.gate_proj", "model.layers.42.mlp.experts.28.gate_proj", "model.layers.42.mlp.experts.29.gate_proj", "model.layers.42.mlp.experts.30.gate_proj", "model.layers.42.mlp.experts.31.gate_proj", "model.layers.42.mlp.experts.32.gate_proj", "model.layers.42.mlp.experts.33.gate_proj", "model.layers.42.mlp.experts.34.gate_proj", "model.layers.42.mlp.experts.35.gate_proj", "model.layers.42.mlp.experts.36.gate_proj", "model.layers.42.mlp.experts.37.gate_proj", "model.layers.42.mlp.experts.38.gate_proj", "model.layers.42.mlp.experts.39.gate_proj", "model.layers.42.mlp.experts.40.gate_proj", "model.layers.42.mlp.experts.41.gate_proj", "model.layers.42.mlp.experts.42.gate_proj", "model.layers.42.mlp.experts.43.gate_proj", "model.layers.42.mlp.experts.44.gate_proj", "model.layers.42.mlp.experts.45.gate_proj", "model.layers.42.mlp.experts.46.gate_proj", "model.layers.42.mlp.experts.47.gate_proj", "model.layers.42.mlp.experts.48.gate_proj", "model.layers.42.mlp.experts.49.gate_proj", "model.layers.42.mlp.experts.50.gate_proj", "model.layers.42.mlp.experts.51.gate_proj", "model.layers.42.mlp.experts.52.gate_proj", "model.layers.42.mlp.experts.53.gate_proj", "model.layers.42.mlp.experts.54.gate_proj", "model.layers.42.mlp.experts.55.gate_proj", "model.layers.42.mlp.experts.56.gate_proj", "model.layers.42.mlp.experts.57.gate_proj", "model.layers.42.mlp.experts.58.gate_proj", "model.layers.42.mlp.experts.59.gate_proj", "model.layers.42.mlp.experts.60.gate_proj", "model.layers.42.mlp.experts.61.gate_proj", "model.layers.42.mlp.experts.62.gate_proj", "model.layers.42.mlp.experts.63.gate_proj", "model.layers.42.mlp.experts.64.gate_proj", "model.layers.42.mlp.experts.65.gate_proj", "model.layers.42.mlp.experts.66.gate_proj", "model.layers.42.mlp.experts.67.gate_proj", "model.layers.42.mlp.experts.68.gate_proj", "model.layers.42.mlp.experts.69.gate_proj", "model.layers.42.mlp.experts.70.gate_proj", "model.layers.42.mlp.experts.71.gate_proj", "model.layers.42.mlp.experts.72.gate_proj", "model.layers.42.mlp.experts.73.gate_proj", "model.layers.42.mlp.experts.74.gate_proj", "model.layers.42.mlp.experts.75.gate_proj", "model.layers.42.mlp.experts.76.gate_proj", "model.layers.42.mlp.experts.77.gate_proj", "model.layers.42.mlp.experts.78.gate_proj", "model.layers.42.mlp.experts.79.gate_proj", "model.layers.42.mlp.experts.80.gate_proj", "model.layers.42.mlp.experts.81.gate_proj", "model.layers.42.mlp.experts.82.gate_proj", "model.layers.42.mlp.experts.83.gate_proj", "model.layers.42.mlp.experts.84.gate_proj", "model.layers.42.mlp.experts.85.gate_proj", "model.layers.42.mlp.experts.86.gate_proj", "model.layers.42.mlp.experts.87.gate_proj", "model.layers.42.mlp.experts.88.gate_proj", "model.layers.42.mlp.experts.89.gate_proj", "model.layers.42.mlp.experts.90.gate_proj", "model.layers.42.mlp.experts.91.gate_proj", "model.layers.42.mlp.experts.92.gate_proj", "model.layers.42.mlp.experts.93.gate_proj", "model.layers.42.mlp.experts.94.gate_proj", "model.layers.42.mlp.experts.95.gate_proj", "model.layers.42.mlp.experts.96.gate_proj", "model.layers.42.mlp.experts.97.gate_proj", "model.layers.42.mlp.experts.98.gate_proj", "model.layers.42.mlp.experts.99.gate_proj", "model.layers.42.mlp.experts.100.gate_proj", "model.layers.42.mlp.experts.101.gate_proj", "model.layers.42.mlp.experts.102.gate_proj", "model.layers.42.mlp.experts.103.gate_proj", "model.layers.42.mlp.experts.104.gate_proj", "model.layers.42.mlp.experts.105.gate_proj", "model.layers.42.mlp.experts.106.gate_proj", "model.layers.42.mlp.experts.107.gate_proj", "model.layers.42.mlp.experts.108.gate_proj", "model.layers.42.mlp.experts.109.gate_proj", "model.layers.42.mlp.experts.110.gate_proj", "model.layers.42.mlp.experts.111.gate_proj", "model.layers.42.mlp.experts.112.gate_proj", "model.layers.42.mlp.experts.113.gate_proj", "model.layers.42.mlp.experts.114.gate_proj", "model.layers.42.mlp.experts.115.gate_proj", "model.layers.42.mlp.experts.116.gate_proj", "model.layers.42.mlp.experts.117.gate_proj", "model.layers.42.mlp.experts.118.gate_proj", "model.layers.42.mlp.experts.119.gate_proj", "model.layers.42.mlp.experts.120.gate_proj", "model.layers.42.mlp.experts.121.gate_proj", "model.layers.42.mlp.experts.122.gate_proj", "model.layers.42.mlp.experts.123.gate_proj", "model.layers.42.mlp.experts.124.gate_proj", "model.layers.42.mlp.experts.125.gate_proj", "model.layers.42.mlp.experts.126.gate_proj", "model.layers.42.mlp.experts.127.gate_proj", "model.layers.42.mlp.experts.128.gate_proj", "model.layers.42.mlp.experts.129.gate_proj", "model.layers.42.mlp.experts.130.gate_proj", "model.layers.42.mlp.experts.131.gate_proj", "model.layers.42.mlp.experts.132.gate_proj", "model.layers.42.mlp.experts.133.gate_proj", "model.layers.42.mlp.experts.134.gate_proj", "model.layers.42.mlp.experts.135.gate_proj", "model.layers.42.mlp.experts.136.gate_proj", "model.layers.42.mlp.experts.137.gate_proj", "model.layers.42.mlp.experts.138.gate_proj", "model.layers.42.mlp.experts.139.gate_proj", "model.layers.42.mlp.experts.140.gate_proj", "model.layers.42.mlp.experts.141.gate_proj", "model.layers.42.mlp.experts.142.gate_proj", "model.layers.42.mlp.experts.143.gate_proj", "model.layers.42.mlp.experts.144.gate_proj", "model.layers.42.mlp.experts.145.gate_proj", "model.layers.42.mlp.experts.146.gate_proj", "model.layers.42.mlp.experts.147.gate_proj", "model.layers.42.mlp.experts.148.gate_proj", "model.layers.42.mlp.experts.149.gate_proj", "model.layers.42.mlp.experts.150.gate_proj", "model.layers.42.mlp.experts.151.gate_proj", "model.layers.42.mlp.experts.152.gate_proj", "model.layers.42.mlp.experts.153.gate_proj", "model.layers.42.mlp.experts.154.gate_proj", "model.layers.42.mlp.experts.155.gate_proj", "model.layers.42.mlp.experts.156.gate_proj", "model.layers.42.mlp.experts.157.gate_proj", "model.layers.42.mlp.experts.158.gate_proj", "model.layers.42.mlp.experts.159.gate_proj", "model.layers.42.mlp.experts.0.up_proj", "model.layers.42.mlp.experts.1.up_proj", "model.layers.42.mlp.experts.2.up_proj", "model.layers.42.mlp.experts.3.up_proj", "model.layers.42.mlp.experts.4.up_proj", "model.layers.42.mlp.experts.5.up_proj", "model.layers.42.mlp.experts.6.up_proj", "model.layers.42.mlp.experts.7.up_proj", "model.layers.42.mlp.experts.8.up_proj", "model.layers.42.mlp.experts.9.up_proj", "model.layers.42.mlp.experts.10.up_proj", "model.layers.42.mlp.experts.11.up_proj", "model.layers.42.mlp.experts.12.up_proj", "model.layers.42.mlp.experts.13.up_proj", "model.layers.42.mlp.experts.14.up_proj", "model.layers.42.mlp.experts.15.up_proj", "model.layers.42.mlp.experts.16.up_proj", "model.layers.42.mlp.experts.17.up_proj", "model.layers.42.mlp.experts.18.up_proj", "model.layers.42.mlp.experts.19.up_proj", "model.layers.42.mlp.experts.20.up_proj", "model.layers.42.mlp.experts.21.up_proj", "model.layers.42.mlp.experts.22.up_proj", "model.layers.42.mlp.experts.23.up_proj", "model.layers.42.mlp.experts.24.up_proj", "model.layers.42.mlp.experts.25.up_proj", "model.layers.42.mlp.experts.26.up_proj", "model.layers.42.mlp.experts.27.up_proj", "model.layers.42.mlp.experts.28.up_proj", "model.layers.42.mlp.experts.29.up_proj", "model.layers.42.mlp.experts.30.up_proj", "model.layers.42.mlp.experts.31.up_proj", "model.layers.42.mlp.experts.32.up_proj", "model.layers.42.mlp.experts.33.up_proj", "model.layers.42.mlp.experts.34.up_proj", "model.layers.42.mlp.experts.35.up_proj", "model.layers.42.mlp.experts.36.up_proj", "model.layers.42.mlp.experts.37.up_proj", "model.layers.42.mlp.experts.38.up_proj", "model.layers.42.mlp.experts.39.up_proj", "model.layers.42.mlp.experts.40.up_proj", "model.layers.42.mlp.experts.41.up_proj", "model.layers.42.mlp.experts.42.up_proj", "model.layers.42.mlp.experts.43.up_proj", "model.layers.42.mlp.experts.44.up_proj", "model.layers.42.mlp.experts.45.up_proj", "model.layers.42.mlp.experts.46.up_proj", "model.layers.42.mlp.experts.47.up_proj", "model.layers.42.mlp.experts.48.up_proj", "model.layers.42.mlp.experts.49.up_proj", "model.layers.42.mlp.experts.50.up_proj", "model.layers.42.mlp.experts.51.up_proj", "model.layers.42.mlp.experts.52.up_proj", "model.layers.42.mlp.experts.53.up_proj", "model.layers.42.mlp.experts.54.up_proj", "model.layers.42.mlp.experts.55.up_proj", "model.layers.42.mlp.experts.56.up_proj", "model.layers.42.mlp.experts.57.up_proj", "model.layers.42.mlp.experts.58.up_proj", "model.layers.42.mlp.experts.59.up_proj", "model.layers.42.mlp.experts.60.up_proj", "model.layers.42.mlp.experts.61.up_proj", "model.layers.42.mlp.experts.62.up_proj", "model.layers.42.mlp.experts.63.up_proj", "model.layers.42.mlp.experts.64.up_proj", "model.layers.42.mlp.experts.65.up_proj", "model.layers.42.mlp.experts.66.up_proj", "model.layers.42.mlp.experts.67.up_proj", "model.layers.42.mlp.experts.68.up_proj", "model.layers.42.mlp.experts.69.up_proj", "model.layers.42.mlp.experts.70.up_proj", "model.layers.42.mlp.experts.71.up_proj", "model.layers.42.mlp.experts.72.up_proj", "model.layers.42.mlp.experts.73.up_proj", "model.layers.42.mlp.experts.74.up_proj", "model.layers.42.mlp.experts.75.up_proj", "model.layers.42.mlp.experts.76.up_proj", "model.layers.42.mlp.experts.77.up_proj", "model.layers.42.mlp.experts.78.up_proj", "model.layers.42.mlp.experts.79.up_proj", "model.layers.42.mlp.experts.80.up_proj", "model.layers.42.mlp.experts.81.up_proj", "model.layers.42.mlp.experts.82.up_proj", "model.layers.42.mlp.experts.83.up_proj", "model.layers.42.mlp.experts.84.up_proj", "model.layers.42.mlp.experts.85.up_proj", "model.layers.42.mlp.experts.86.up_proj", "model.layers.42.mlp.experts.87.up_proj", "model.layers.42.mlp.experts.88.up_proj", "model.layers.42.mlp.experts.89.up_proj", "model.layers.42.mlp.experts.90.up_proj", "model.layers.42.mlp.experts.91.up_proj", "model.layers.42.mlp.experts.92.up_proj", "model.layers.42.mlp.experts.93.up_proj", "model.layers.42.mlp.experts.94.up_proj", "model.layers.42.mlp.experts.95.up_proj", "model.layers.42.mlp.experts.96.up_proj", "model.layers.42.mlp.experts.97.up_proj", "model.layers.42.mlp.experts.98.up_proj", "model.layers.42.mlp.experts.99.up_proj", "model.layers.42.mlp.experts.100.up_proj", "model.layers.42.mlp.experts.101.up_proj", "model.layers.42.mlp.experts.102.up_proj", "model.layers.42.mlp.experts.103.up_proj", "model.layers.42.mlp.experts.104.up_proj", "model.layers.42.mlp.experts.105.up_proj", "model.layers.42.mlp.experts.106.up_proj", "model.layers.42.mlp.experts.107.up_proj", "model.layers.42.mlp.experts.108.up_proj", "model.layers.42.mlp.experts.109.up_proj", "model.layers.42.mlp.experts.110.up_proj", "model.layers.42.mlp.experts.111.up_proj", "model.layers.42.mlp.experts.112.up_proj", "model.layers.42.mlp.experts.113.up_proj", "model.layers.42.mlp.experts.114.up_proj", "model.layers.42.mlp.experts.115.up_proj", "model.layers.42.mlp.experts.116.up_proj", "model.layers.42.mlp.experts.117.up_proj", "model.layers.42.mlp.experts.118.up_proj", "model.layers.42.mlp.experts.119.up_proj", "model.layers.42.mlp.experts.120.up_proj", "model.layers.42.mlp.experts.121.up_proj", "model.layers.42.mlp.experts.122.up_proj", "model.layers.42.mlp.experts.123.up_proj", "model.layers.42.mlp.experts.124.up_proj", "model.layers.42.mlp.experts.125.up_proj", "model.layers.42.mlp.experts.126.up_proj", "model.layers.42.mlp.experts.127.up_proj", "model.layers.42.mlp.experts.128.up_proj", "model.layers.42.mlp.experts.129.up_proj", "model.layers.42.mlp.experts.130.up_proj", "model.layers.42.mlp.experts.131.up_proj", "model.layers.42.mlp.experts.132.up_proj", "model.layers.42.mlp.experts.133.up_proj", "model.layers.42.mlp.experts.134.up_proj", "model.layers.42.mlp.experts.135.up_proj", "model.layers.42.mlp.experts.136.up_proj", "model.layers.42.mlp.experts.137.up_proj", "model.layers.42.mlp.experts.138.up_proj", "model.layers.42.mlp.experts.139.up_proj", "model.layers.42.mlp.experts.140.up_proj", "model.layers.42.mlp.experts.141.up_proj", "model.layers.42.mlp.experts.142.up_proj", "model.layers.42.mlp.experts.143.up_proj", "model.layers.42.mlp.experts.144.up_proj", "model.layers.42.mlp.experts.145.up_proj", "model.layers.42.mlp.experts.146.up_proj", "model.layers.42.mlp.experts.147.up_proj", "model.layers.42.mlp.experts.148.up_proj", "model.layers.42.mlp.experts.149.up_proj", "model.layers.42.mlp.experts.150.up_proj", "model.layers.42.mlp.experts.151.up_proj", "model.layers.42.mlp.experts.152.up_proj", "model.layers.42.mlp.experts.153.up_proj", "model.layers.42.mlp.experts.154.up_proj", "model.layers.42.mlp.experts.155.up_proj", "model.layers.42.mlp.experts.156.up_proj", "model.layers.42.mlp.experts.157.up_proj", "model.layers.42.mlp.experts.158.up_proj", "model.layers.42.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -2.0233052782713673e-05, "dbits": 2516582400 }, { "dkld": -3.62154794856899e-05, "dbits": 5033164800 } ] }, { "idx": 254, "layers": [ "model.layers.42.mlp.experts.0.down_proj", "model.layers.42.mlp.experts.1.down_proj", "model.layers.42.mlp.experts.2.down_proj", "model.layers.42.mlp.experts.3.down_proj", "model.layers.42.mlp.experts.4.down_proj", "model.layers.42.mlp.experts.5.down_proj", "model.layers.42.mlp.experts.6.down_proj", "model.layers.42.mlp.experts.7.down_proj", "model.layers.42.mlp.experts.8.down_proj", "model.layers.42.mlp.experts.9.down_proj", "model.layers.42.mlp.experts.10.down_proj", "model.layers.42.mlp.experts.11.down_proj", "model.layers.42.mlp.experts.12.down_proj", "model.layers.42.mlp.experts.13.down_proj", "model.layers.42.mlp.experts.14.down_proj", "model.layers.42.mlp.experts.15.down_proj", "model.layers.42.mlp.experts.16.down_proj", "model.layers.42.mlp.experts.17.down_proj", "model.layers.42.mlp.experts.18.down_proj", "model.layers.42.mlp.experts.19.down_proj", "model.layers.42.mlp.experts.20.down_proj", "model.layers.42.mlp.experts.21.down_proj", "model.layers.42.mlp.experts.22.down_proj", "model.layers.42.mlp.experts.23.down_proj", "model.layers.42.mlp.experts.24.down_proj", "model.layers.42.mlp.experts.25.down_proj", "model.layers.42.mlp.experts.26.down_proj", "model.layers.42.mlp.experts.27.down_proj", "model.layers.42.mlp.experts.28.down_proj", "model.layers.42.mlp.experts.29.down_proj", "model.layers.42.mlp.experts.30.down_proj", "model.layers.42.mlp.experts.31.down_proj", "model.layers.42.mlp.experts.32.down_proj", "model.layers.42.mlp.experts.33.down_proj", "model.layers.42.mlp.experts.34.down_proj", "model.layers.42.mlp.experts.35.down_proj", "model.layers.42.mlp.experts.36.down_proj", "model.layers.42.mlp.experts.37.down_proj", "model.layers.42.mlp.experts.38.down_proj", "model.layers.42.mlp.experts.39.down_proj", "model.layers.42.mlp.experts.40.down_proj", "model.layers.42.mlp.experts.41.down_proj", "model.layers.42.mlp.experts.42.down_proj", "model.layers.42.mlp.experts.43.down_proj", "model.layers.42.mlp.experts.44.down_proj", "model.layers.42.mlp.experts.45.down_proj", "model.layers.42.mlp.experts.46.down_proj", "model.layers.42.mlp.experts.47.down_proj", "model.layers.42.mlp.experts.48.down_proj", "model.layers.42.mlp.experts.49.down_proj", "model.layers.42.mlp.experts.50.down_proj", "model.layers.42.mlp.experts.51.down_proj", "model.layers.42.mlp.experts.52.down_proj", "model.layers.42.mlp.experts.53.down_proj", "model.layers.42.mlp.experts.54.down_proj", "model.layers.42.mlp.experts.55.down_proj", "model.layers.42.mlp.experts.56.down_proj", "model.layers.42.mlp.experts.57.down_proj", "model.layers.42.mlp.experts.58.down_proj", "model.layers.42.mlp.experts.59.down_proj", "model.layers.42.mlp.experts.60.down_proj", "model.layers.42.mlp.experts.61.down_proj", "model.layers.42.mlp.experts.62.down_proj", "model.layers.42.mlp.experts.63.down_proj", "model.layers.42.mlp.experts.64.down_proj", "model.layers.42.mlp.experts.65.down_proj", "model.layers.42.mlp.experts.66.down_proj", "model.layers.42.mlp.experts.67.down_proj", "model.layers.42.mlp.experts.68.down_proj", "model.layers.42.mlp.experts.69.down_proj", "model.layers.42.mlp.experts.70.down_proj", "model.layers.42.mlp.experts.71.down_proj", "model.layers.42.mlp.experts.72.down_proj", "model.layers.42.mlp.experts.73.down_proj", "model.layers.42.mlp.experts.74.down_proj", "model.layers.42.mlp.experts.75.down_proj", "model.layers.42.mlp.experts.76.down_proj", "model.layers.42.mlp.experts.77.down_proj", "model.layers.42.mlp.experts.78.down_proj", "model.layers.42.mlp.experts.79.down_proj", "model.layers.42.mlp.experts.80.down_proj", "model.layers.42.mlp.experts.81.down_proj", "model.layers.42.mlp.experts.82.down_proj", "model.layers.42.mlp.experts.83.down_proj", "model.layers.42.mlp.experts.84.down_proj", "model.layers.42.mlp.experts.85.down_proj", "model.layers.42.mlp.experts.86.down_proj", "model.layers.42.mlp.experts.87.down_proj", "model.layers.42.mlp.experts.88.down_proj", "model.layers.42.mlp.experts.89.down_proj", "model.layers.42.mlp.experts.90.down_proj", "model.layers.42.mlp.experts.91.down_proj", "model.layers.42.mlp.experts.92.down_proj", "model.layers.42.mlp.experts.93.down_proj", "model.layers.42.mlp.experts.94.down_proj", "model.layers.42.mlp.experts.95.down_proj", "model.layers.42.mlp.experts.96.down_proj", "model.layers.42.mlp.experts.97.down_proj", "model.layers.42.mlp.experts.98.down_proj", "model.layers.42.mlp.experts.99.down_proj", "model.layers.42.mlp.experts.100.down_proj", "model.layers.42.mlp.experts.101.down_proj", "model.layers.42.mlp.experts.102.down_proj", "model.layers.42.mlp.experts.103.down_proj", "model.layers.42.mlp.experts.104.down_proj", "model.layers.42.mlp.experts.105.down_proj", "model.layers.42.mlp.experts.106.down_proj", "model.layers.42.mlp.experts.107.down_proj", "model.layers.42.mlp.experts.108.down_proj", "model.layers.42.mlp.experts.109.down_proj", "model.layers.42.mlp.experts.110.down_proj", "model.layers.42.mlp.experts.111.down_proj", "model.layers.42.mlp.experts.112.down_proj", "model.layers.42.mlp.experts.113.down_proj", "model.layers.42.mlp.experts.114.down_proj", "model.layers.42.mlp.experts.115.down_proj", "model.layers.42.mlp.experts.116.down_proj", "model.layers.42.mlp.experts.117.down_proj", "model.layers.42.mlp.experts.118.down_proj", "model.layers.42.mlp.experts.119.down_proj", "model.layers.42.mlp.experts.120.down_proj", "model.layers.42.mlp.experts.121.down_proj", "model.layers.42.mlp.experts.122.down_proj", "model.layers.42.mlp.experts.123.down_proj", "model.layers.42.mlp.experts.124.down_proj", "model.layers.42.mlp.experts.125.down_proj", "model.layers.42.mlp.experts.126.down_proj", "model.layers.42.mlp.experts.127.down_proj", "model.layers.42.mlp.experts.128.down_proj", "model.layers.42.mlp.experts.129.down_proj", "model.layers.42.mlp.experts.130.down_proj", "model.layers.42.mlp.experts.131.down_proj", "model.layers.42.mlp.experts.132.down_proj", "model.layers.42.mlp.experts.133.down_proj", "model.layers.42.mlp.experts.134.down_proj", "model.layers.42.mlp.experts.135.down_proj", "model.layers.42.mlp.experts.136.down_proj", "model.layers.42.mlp.experts.137.down_proj", "model.layers.42.mlp.experts.138.down_proj", "model.layers.42.mlp.experts.139.down_proj", "model.layers.42.mlp.experts.140.down_proj", "model.layers.42.mlp.experts.141.down_proj", "model.layers.42.mlp.experts.142.down_proj", "model.layers.42.mlp.experts.143.down_proj", "model.layers.42.mlp.experts.144.down_proj", "model.layers.42.mlp.experts.145.down_proj", "model.layers.42.mlp.experts.146.down_proj", "model.layers.42.mlp.experts.147.down_proj", "model.layers.42.mlp.experts.148.down_proj", "model.layers.42.mlp.experts.149.down_proj", "model.layers.42.mlp.experts.150.down_proj", "model.layers.42.mlp.experts.151.down_proj", "model.layers.42.mlp.experts.152.down_proj", "model.layers.42.mlp.experts.153.down_proj", "model.layers.42.mlp.experts.154.down_proj", "model.layers.42.mlp.experts.155.down_proj", "model.layers.42.mlp.experts.156.down_proj", "model.layers.42.mlp.experts.157.down_proj", "model.layers.42.mlp.experts.158.down_proj", "model.layers.42.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -3.190129064023495e-05, "dbits": 1258291200 }, { "dkld": -3.1986762769518895e-05, "dbits": 2516582400 } ] }, { "idx": 255, "layers": [ "model.layers.43.self_attn.q_proj" ], "candidates": [ { "dkld": -7.627368904650211e-05, "dbits": 62914560 }, { "dkld": -7.276430260389974e-05, "dbits": 125829120 } ] }, { "idx": 256, "layers": [ "model.layers.43.self_attn.k_proj", "model.layers.43.self_attn.v_proj" ], "candidates": [ { "dkld": 4.878966137766838e-07, "dbits": 10485760 }, { "dkld": 1.351761166006396e-05, "dbits": 20971520 } ] }, { "idx": 257, "layers": [ "model.layers.43.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00010034965816885233, "dbits": 62914560 }, { "dkld": -0.00013116481713950495, "dbits": 125829120 } ] }, { "idx": 258, "layers": [ "model.layers.43.mlp.shared_experts.gate_proj", "model.layers.43.mlp.shared_experts.up_proj", "model.layers.43.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 2.3774267174304226e-05, "dbits": 23592960 }, { "dkld": -1.7489190213382244e-05, "dbits": 47185920 } ] }, { "idx": 259, "layers": [ "model.layers.43.mlp.experts.0.gate_proj", "model.layers.43.mlp.experts.1.gate_proj", "model.layers.43.mlp.experts.2.gate_proj", "model.layers.43.mlp.experts.3.gate_proj", "model.layers.43.mlp.experts.4.gate_proj", "model.layers.43.mlp.experts.5.gate_proj", "model.layers.43.mlp.experts.6.gate_proj", "model.layers.43.mlp.experts.7.gate_proj", "model.layers.43.mlp.experts.8.gate_proj", "model.layers.43.mlp.experts.9.gate_proj", "model.layers.43.mlp.experts.10.gate_proj", "model.layers.43.mlp.experts.11.gate_proj", "model.layers.43.mlp.experts.12.gate_proj", "model.layers.43.mlp.experts.13.gate_proj", "model.layers.43.mlp.experts.14.gate_proj", "model.layers.43.mlp.experts.15.gate_proj", "model.layers.43.mlp.experts.16.gate_proj", "model.layers.43.mlp.experts.17.gate_proj", "model.layers.43.mlp.experts.18.gate_proj", "model.layers.43.mlp.experts.19.gate_proj", "model.layers.43.mlp.experts.20.gate_proj", "model.layers.43.mlp.experts.21.gate_proj", "model.layers.43.mlp.experts.22.gate_proj", "model.layers.43.mlp.experts.23.gate_proj", "model.layers.43.mlp.experts.24.gate_proj", "model.layers.43.mlp.experts.25.gate_proj", "model.layers.43.mlp.experts.26.gate_proj", "model.layers.43.mlp.experts.27.gate_proj", "model.layers.43.mlp.experts.28.gate_proj", "model.layers.43.mlp.experts.29.gate_proj", "model.layers.43.mlp.experts.30.gate_proj", "model.layers.43.mlp.experts.31.gate_proj", "model.layers.43.mlp.experts.32.gate_proj", "model.layers.43.mlp.experts.33.gate_proj", "model.layers.43.mlp.experts.34.gate_proj", "model.layers.43.mlp.experts.35.gate_proj", "model.layers.43.mlp.experts.36.gate_proj", "model.layers.43.mlp.experts.37.gate_proj", "model.layers.43.mlp.experts.38.gate_proj", "model.layers.43.mlp.experts.39.gate_proj", "model.layers.43.mlp.experts.40.gate_proj", "model.layers.43.mlp.experts.41.gate_proj", "model.layers.43.mlp.experts.42.gate_proj", "model.layers.43.mlp.experts.43.gate_proj", "model.layers.43.mlp.experts.44.gate_proj", "model.layers.43.mlp.experts.45.gate_proj", "model.layers.43.mlp.experts.46.gate_proj", "model.layers.43.mlp.experts.47.gate_proj", "model.layers.43.mlp.experts.48.gate_proj", "model.layers.43.mlp.experts.49.gate_proj", "model.layers.43.mlp.experts.50.gate_proj", "model.layers.43.mlp.experts.51.gate_proj", "model.layers.43.mlp.experts.52.gate_proj", "model.layers.43.mlp.experts.53.gate_proj", "model.layers.43.mlp.experts.54.gate_proj", "model.layers.43.mlp.experts.55.gate_proj", "model.layers.43.mlp.experts.56.gate_proj", "model.layers.43.mlp.experts.57.gate_proj", "model.layers.43.mlp.experts.58.gate_proj", "model.layers.43.mlp.experts.59.gate_proj", "model.layers.43.mlp.experts.60.gate_proj", "model.layers.43.mlp.experts.61.gate_proj", "model.layers.43.mlp.experts.62.gate_proj", "model.layers.43.mlp.experts.63.gate_proj", "model.layers.43.mlp.experts.64.gate_proj", "model.layers.43.mlp.experts.65.gate_proj", "model.layers.43.mlp.experts.66.gate_proj", "model.layers.43.mlp.experts.67.gate_proj", "model.layers.43.mlp.experts.68.gate_proj", "model.layers.43.mlp.experts.69.gate_proj", "model.layers.43.mlp.experts.70.gate_proj", "model.layers.43.mlp.experts.71.gate_proj", "model.layers.43.mlp.experts.72.gate_proj", "model.layers.43.mlp.experts.73.gate_proj", "model.layers.43.mlp.experts.74.gate_proj", "model.layers.43.mlp.experts.75.gate_proj", "model.layers.43.mlp.experts.76.gate_proj", "model.layers.43.mlp.experts.77.gate_proj", "model.layers.43.mlp.experts.78.gate_proj", "model.layers.43.mlp.experts.79.gate_proj", "model.layers.43.mlp.experts.80.gate_proj", "model.layers.43.mlp.experts.81.gate_proj", "model.layers.43.mlp.experts.82.gate_proj", "model.layers.43.mlp.experts.83.gate_proj", "model.layers.43.mlp.experts.84.gate_proj", "model.layers.43.mlp.experts.85.gate_proj", "model.layers.43.mlp.experts.86.gate_proj", "model.layers.43.mlp.experts.87.gate_proj", "model.layers.43.mlp.experts.88.gate_proj", "model.layers.43.mlp.experts.89.gate_proj", "model.layers.43.mlp.experts.90.gate_proj", "model.layers.43.mlp.experts.91.gate_proj", "model.layers.43.mlp.experts.92.gate_proj", "model.layers.43.mlp.experts.93.gate_proj", "model.layers.43.mlp.experts.94.gate_proj", "model.layers.43.mlp.experts.95.gate_proj", "model.layers.43.mlp.experts.96.gate_proj", "model.layers.43.mlp.experts.97.gate_proj", "model.layers.43.mlp.experts.98.gate_proj", "model.layers.43.mlp.experts.99.gate_proj", "model.layers.43.mlp.experts.100.gate_proj", "model.layers.43.mlp.experts.101.gate_proj", "model.layers.43.mlp.experts.102.gate_proj", "model.layers.43.mlp.experts.103.gate_proj", "model.layers.43.mlp.experts.104.gate_proj", "model.layers.43.mlp.experts.105.gate_proj", "model.layers.43.mlp.experts.106.gate_proj", "model.layers.43.mlp.experts.107.gate_proj", "model.layers.43.mlp.experts.108.gate_proj", "model.layers.43.mlp.experts.109.gate_proj", "model.layers.43.mlp.experts.110.gate_proj", "model.layers.43.mlp.experts.111.gate_proj", "model.layers.43.mlp.experts.112.gate_proj", "model.layers.43.mlp.experts.113.gate_proj", "model.layers.43.mlp.experts.114.gate_proj", "model.layers.43.mlp.experts.115.gate_proj", "model.layers.43.mlp.experts.116.gate_proj", "model.layers.43.mlp.experts.117.gate_proj", "model.layers.43.mlp.experts.118.gate_proj", "model.layers.43.mlp.experts.119.gate_proj", "model.layers.43.mlp.experts.120.gate_proj", "model.layers.43.mlp.experts.121.gate_proj", "model.layers.43.mlp.experts.122.gate_proj", "model.layers.43.mlp.experts.123.gate_proj", "model.layers.43.mlp.experts.124.gate_proj", "model.layers.43.mlp.experts.125.gate_proj", "model.layers.43.mlp.experts.126.gate_proj", "model.layers.43.mlp.experts.127.gate_proj", "model.layers.43.mlp.experts.128.gate_proj", "model.layers.43.mlp.experts.129.gate_proj", "model.layers.43.mlp.experts.130.gate_proj", "model.layers.43.mlp.experts.131.gate_proj", "model.layers.43.mlp.experts.132.gate_proj", "model.layers.43.mlp.experts.133.gate_proj", "model.layers.43.mlp.experts.134.gate_proj", "model.layers.43.mlp.experts.135.gate_proj", "model.layers.43.mlp.experts.136.gate_proj", "model.layers.43.mlp.experts.137.gate_proj", "model.layers.43.mlp.experts.138.gate_proj", "model.layers.43.mlp.experts.139.gate_proj", "model.layers.43.mlp.experts.140.gate_proj", "model.layers.43.mlp.experts.141.gate_proj", "model.layers.43.mlp.experts.142.gate_proj", "model.layers.43.mlp.experts.143.gate_proj", "model.layers.43.mlp.experts.144.gate_proj", "model.layers.43.mlp.experts.145.gate_proj", "model.layers.43.mlp.experts.146.gate_proj", "model.layers.43.mlp.experts.147.gate_proj", "model.layers.43.mlp.experts.148.gate_proj", "model.layers.43.mlp.experts.149.gate_proj", "model.layers.43.mlp.experts.150.gate_proj", "model.layers.43.mlp.experts.151.gate_proj", "model.layers.43.mlp.experts.152.gate_proj", "model.layers.43.mlp.experts.153.gate_proj", "model.layers.43.mlp.experts.154.gate_proj", "model.layers.43.mlp.experts.155.gate_proj", "model.layers.43.mlp.experts.156.gate_proj", "model.layers.43.mlp.experts.157.gate_proj", "model.layers.43.mlp.experts.158.gate_proj", "model.layers.43.mlp.experts.159.gate_proj", "model.layers.43.mlp.experts.0.up_proj", "model.layers.43.mlp.experts.1.up_proj", "model.layers.43.mlp.experts.2.up_proj", "model.layers.43.mlp.experts.3.up_proj", "model.layers.43.mlp.experts.4.up_proj", "model.layers.43.mlp.experts.5.up_proj", "model.layers.43.mlp.experts.6.up_proj", "model.layers.43.mlp.experts.7.up_proj", "model.layers.43.mlp.experts.8.up_proj", "model.layers.43.mlp.experts.9.up_proj", "model.layers.43.mlp.experts.10.up_proj", "model.layers.43.mlp.experts.11.up_proj", "model.layers.43.mlp.experts.12.up_proj", "model.layers.43.mlp.experts.13.up_proj", "model.layers.43.mlp.experts.14.up_proj", "model.layers.43.mlp.experts.15.up_proj", "model.layers.43.mlp.experts.16.up_proj", "model.layers.43.mlp.experts.17.up_proj", "model.layers.43.mlp.experts.18.up_proj", "model.layers.43.mlp.experts.19.up_proj", "model.layers.43.mlp.experts.20.up_proj", "model.layers.43.mlp.experts.21.up_proj", "model.layers.43.mlp.experts.22.up_proj", "model.layers.43.mlp.experts.23.up_proj", "model.layers.43.mlp.experts.24.up_proj", "model.layers.43.mlp.experts.25.up_proj", "model.layers.43.mlp.experts.26.up_proj", "model.layers.43.mlp.experts.27.up_proj", "model.layers.43.mlp.experts.28.up_proj", "model.layers.43.mlp.experts.29.up_proj", "model.layers.43.mlp.experts.30.up_proj", "model.layers.43.mlp.experts.31.up_proj", "model.layers.43.mlp.experts.32.up_proj", "model.layers.43.mlp.experts.33.up_proj", "model.layers.43.mlp.experts.34.up_proj", "model.layers.43.mlp.experts.35.up_proj", "model.layers.43.mlp.experts.36.up_proj", "model.layers.43.mlp.experts.37.up_proj", "model.layers.43.mlp.experts.38.up_proj", "model.layers.43.mlp.experts.39.up_proj", "model.layers.43.mlp.experts.40.up_proj", "model.layers.43.mlp.experts.41.up_proj", "model.layers.43.mlp.experts.42.up_proj", "model.layers.43.mlp.experts.43.up_proj", "model.layers.43.mlp.experts.44.up_proj", "model.layers.43.mlp.experts.45.up_proj", "model.layers.43.mlp.experts.46.up_proj", "model.layers.43.mlp.experts.47.up_proj", "model.layers.43.mlp.experts.48.up_proj", "model.layers.43.mlp.experts.49.up_proj", "model.layers.43.mlp.experts.50.up_proj", "model.layers.43.mlp.experts.51.up_proj", "model.layers.43.mlp.experts.52.up_proj", "model.layers.43.mlp.experts.53.up_proj", "model.layers.43.mlp.experts.54.up_proj", "model.layers.43.mlp.experts.55.up_proj", "model.layers.43.mlp.experts.56.up_proj", "model.layers.43.mlp.experts.57.up_proj", "model.layers.43.mlp.experts.58.up_proj", "model.layers.43.mlp.experts.59.up_proj", "model.layers.43.mlp.experts.60.up_proj", "model.layers.43.mlp.experts.61.up_proj", "model.layers.43.mlp.experts.62.up_proj", "model.layers.43.mlp.experts.63.up_proj", "model.layers.43.mlp.experts.64.up_proj", "model.layers.43.mlp.experts.65.up_proj", "model.layers.43.mlp.experts.66.up_proj", "model.layers.43.mlp.experts.67.up_proj", "model.layers.43.mlp.experts.68.up_proj", "model.layers.43.mlp.experts.69.up_proj", "model.layers.43.mlp.experts.70.up_proj", "model.layers.43.mlp.experts.71.up_proj", "model.layers.43.mlp.experts.72.up_proj", "model.layers.43.mlp.experts.73.up_proj", "model.layers.43.mlp.experts.74.up_proj", "model.layers.43.mlp.experts.75.up_proj", "model.layers.43.mlp.experts.76.up_proj", "model.layers.43.mlp.experts.77.up_proj", "model.layers.43.mlp.experts.78.up_proj", "model.layers.43.mlp.experts.79.up_proj", "model.layers.43.mlp.experts.80.up_proj", "model.layers.43.mlp.experts.81.up_proj", "model.layers.43.mlp.experts.82.up_proj", "model.layers.43.mlp.experts.83.up_proj", "model.layers.43.mlp.experts.84.up_proj", "model.layers.43.mlp.experts.85.up_proj", "model.layers.43.mlp.experts.86.up_proj", "model.layers.43.mlp.experts.87.up_proj", "model.layers.43.mlp.experts.88.up_proj", "model.layers.43.mlp.experts.89.up_proj", "model.layers.43.mlp.experts.90.up_proj", "model.layers.43.mlp.experts.91.up_proj", "model.layers.43.mlp.experts.92.up_proj", "model.layers.43.mlp.experts.93.up_proj", "model.layers.43.mlp.experts.94.up_proj", "model.layers.43.mlp.experts.95.up_proj", "model.layers.43.mlp.experts.96.up_proj", "model.layers.43.mlp.experts.97.up_proj", "model.layers.43.mlp.experts.98.up_proj", "model.layers.43.mlp.experts.99.up_proj", "model.layers.43.mlp.experts.100.up_proj", "model.layers.43.mlp.experts.101.up_proj", "model.layers.43.mlp.experts.102.up_proj", "model.layers.43.mlp.experts.103.up_proj", "model.layers.43.mlp.experts.104.up_proj", "model.layers.43.mlp.experts.105.up_proj", "model.layers.43.mlp.experts.106.up_proj", "model.layers.43.mlp.experts.107.up_proj", "model.layers.43.mlp.experts.108.up_proj", "model.layers.43.mlp.experts.109.up_proj", "model.layers.43.mlp.experts.110.up_proj", "model.layers.43.mlp.experts.111.up_proj", "model.layers.43.mlp.experts.112.up_proj", "model.layers.43.mlp.experts.113.up_proj", "model.layers.43.mlp.experts.114.up_proj", "model.layers.43.mlp.experts.115.up_proj", "model.layers.43.mlp.experts.116.up_proj", "model.layers.43.mlp.experts.117.up_proj", "model.layers.43.mlp.experts.118.up_proj", "model.layers.43.mlp.experts.119.up_proj", "model.layers.43.mlp.experts.120.up_proj", "model.layers.43.mlp.experts.121.up_proj", "model.layers.43.mlp.experts.122.up_proj", "model.layers.43.mlp.experts.123.up_proj", "model.layers.43.mlp.experts.124.up_proj", "model.layers.43.mlp.experts.125.up_proj", "model.layers.43.mlp.experts.126.up_proj", "model.layers.43.mlp.experts.127.up_proj", "model.layers.43.mlp.experts.128.up_proj", "model.layers.43.mlp.experts.129.up_proj", "model.layers.43.mlp.experts.130.up_proj", "model.layers.43.mlp.experts.131.up_proj", "model.layers.43.mlp.experts.132.up_proj", "model.layers.43.mlp.experts.133.up_proj", "model.layers.43.mlp.experts.134.up_proj", "model.layers.43.mlp.experts.135.up_proj", "model.layers.43.mlp.experts.136.up_proj", "model.layers.43.mlp.experts.137.up_proj", "model.layers.43.mlp.experts.138.up_proj", "model.layers.43.mlp.experts.139.up_proj", "model.layers.43.mlp.experts.140.up_proj", "model.layers.43.mlp.experts.141.up_proj", "model.layers.43.mlp.experts.142.up_proj", "model.layers.43.mlp.experts.143.up_proj", "model.layers.43.mlp.experts.144.up_proj", "model.layers.43.mlp.experts.145.up_proj", "model.layers.43.mlp.experts.146.up_proj", "model.layers.43.mlp.experts.147.up_proj", "model.layers.43.mlp.experts.148.up_proj", "model.layers.43.mlp.experts.149.up_proj", "model.layers.43.mlp.experts.150.up_proj", "model.layers.43.mlp.experts.151.up_proj", "model.layers.43.mlp.experts.152.up_proj", "model.layers.43.mlp.experts.153.up_proj", "model.layers.43.mlp.experts.154.up_proj", "model.layers.43.mlp.experts.155.up_proj", "model.layers.43.mlp.experts.156.up_proj", "model.layers.43.mlp.experts.157.up_proj", "model.layers.43.mlp.experts.158.up_proj", "model.layers.43.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.81474295258522e-06, "dbits": 2516582400 }, { "dkld": -2.4272524751721772e-05, "dbits": 5033164800 } ] }, { "idx": 260, "layers": [ "model.layers.43.mlp.experts.0.down_proj", "model.layers.43.mlp.experts.1.down_proj", "model.layers.43.mlp.experts.2.down_proj", "model.layers.43.mlp.experts.3.down_proj", "model.layers.43.mlp.experts.4.down_proj", "model.layers.43.mlp.experts.5.down_proj", "model.layers.43.mlp.experts.6.down_proj", "model.layers.43.mlp.experts.7.down_proj", "model.layers.43.mlp.experts.8.down_proj", "model.layers.43.mlp.experts.9.down_proj", "model.layers.43.mlp.experts.10.down_proj", "model.layers.43.mlp.experts.11.down_proj", "model.layers.43.mlp.experts.12.down_proj", "model.layers.43.mlp.experts.13.down_proj", "model.layers.43.mlp.experts.14.down_proj", "model.layers.43.mlp.experts.15.down_proj", "model.layers.43.mlp.experts.16.down_proj", "model.layers.43.mlp.experts.17.down_proj", "model.layers.43.mlp.experts.18.down_proj", "model.layers.43.mlp.experts.19.down_proj", "model.layers.43.mlp.experts.20.down_proj", "model.layers.43.mlp.experts.21.down_proj", "model.layers.43.mlp.experts.22.down_proj", "model.layers.43.mlp.experts.23.down_proj", "model.layers.43.mlp.experts.24.down_proj", "model.layers.43.mlp.experts.25.down_proj", "model.layers.43.mlp.experts.26.down_proj", "model.layers.43.mlp.experts.27.down_proj", "model.layers.43.mlp.experts.28.down_proj", "model.layers.43.mlp.experts.29.down_proj", "model.layers.43.mlp.experts.30.down_proj", "model.layers.43.mlp.experts.31.down_proj", "model.layers.43.mlp.experts.32.down_proj", "model.layers.43.mlp.experts.33.down_proj", "model.layers.43.mlp.experts.34.down_proj", "model.layers.43.mlp.experts.35.down_proj", "model.layers.43.mlp.experts.36.down_proj", "model.layers.43.mlp.experts.37.down_proj", "model.layers.43.mlp.experts.38.down_proj", "model.layers.43.mlp.experts.39.down_proj", "model.layers.43.mlp.experts.40.down_proj", "model.layers.43.mlp.experts.41.down_proj", "model.layers.43.mlp.experts.42.down_proj", "model.layers.43.mlp.experts.43.down_proj", "model.layers.43.mlp.experts.44.down_proj", "model.layers.43.mlp.experts.45.down_proj", "model.layers.43.mlp.experts.46.down_proj", "model.layers.43.mlp.experts.47.down_proj", "model.layers.43.mlp.experts.48.down_proj", "model.layers.43.mlp.experts.49.down_proj", "model.layers.43.mlp.experts.50.down_proj", "model.layers.43.mlp.experts.51.down_proj", "model.layers.43.mlp.experts.52.down_proj", "model.layers.43.mlp.experts.53.down_proj", "model.layers.43.mlp.experts.54.down_proj", "model.layers.43.mlp.experts.55.down_proj", "model.layers.43.mlp.experts.56.down_proj", "model.layers.43.mlp.experts.57.down_proj", "model.layers.43.mlp.experts.58.down_proj", "model.layers.43.mlp.experts.59.down_proj", "model.layers.43.mlp.experts.60.down_proj", "model.layers.43.mlp.experts.61.down_proj", "model.layers.43.mlp.experts.62.down_proj", "model.layers.43.mlp.experts.63.down_proj", "model.layers.43.mlp.experts.64.down_proj", "model.layers.43.mlp.experts.65.down_proj", "model.layers.43.mlp.experts.66.down_proj", "model.layers.43.mlp.experts.67.down_proj", "model.layers.43.mlp.experts.68.down_proj", "model.layers.43.mlp.experts.69.down_proj", "model.layers.43.mlp.experts.70.down_proj", "model.layers.43.mlp.experts.71.down_proj", "model.layers.43.mlp.experts.72.down_proj", "model.layers.43.mlp.experts.73.down_proj", "model.layers.43.mlp.experts.74.down_proj", "model.layers.43.mlp.experts.75.down_proj", "model.layers.43.mlp.experts.76.down_proj", "model.layers.43.mlp.experts.77.down_proj", "model.layers.43.mlp.experts.78.down_proj", "model.layers.43.mlp.experts.79.down_proj", "model.layers.43.mlp.experts.80.down_proj", "model.layers.43.mlp.experts.81.down_proj", "model.layers.43.mlp.experts.82.down_proj", "model.layers.43.mlp.experts.83.down_proj", "model.layers.43.mlp.experts.84.down_proj", "model.layers.43.mlp.experts.85.down_proj", "model.layers.43.mlp.experts.86.down_proj", "model.layers.43.mlp.experts.87.down_proj", "model.layers.43.mlp.experts.88.down_proj", "model.layers.43.mlp.experts.89.down_proj", "model.layers.43.mlp.experts.90.down_proj", "model.layers.43.mlp.experts.91.down_proj", "model.layers.43.mlp.experts.92.down_proj", "model.layers.43.mlp.experts.93.down_proj", "model.layers.43.mlp.experts.94.down_proj", "model.layers.43.mlp.experts.95.down_proj", "model.layers.43.mlp.experts.96.down_proj", "model.layers.43.mlp.experts.97.down_proj", "model.layers.43.mlp.experts.98.down_proj", "model.layers.43.mlp.experts.99.down_proj", "model.layers.43.mlp.experts.100.down_proj", "model.layers.43.mlp.experts.101.down_proj", "model.layers.43.mlp.experts.102.down_proj", "model.layers.43.mlp.experts.103.down_proj", "model.layers.43.mlp.experts.104.down_proj", "model.layers.43.mlp.experts.105.down_proj", "model.layers.43.mlp.experts.106.down_proj", "model.layers.43.mlp.experts.107.down_proj", "model.layers.43.mlp.experts.108.down_proj", "model.layers.43.mlp.experts.109.down_proj", "model.layers.43.mlp.experts.110.down_proj", "model.layers.43.mlp.experts.111.down_proj", "model.layers.43.mlp.experts.112.down_proj", "model.layers.43.mlp.experts.113.down_proj", "model.layers.43.mlp.experts.114.down_proj", "model.layers.43.mlp.experts.115.down_proj", "model.layers.43.mlp.experts.116.down_proj", "model.layers.43.mlp.experts.117.down_proj", "model.layers.43.mlp.experts.118.down_proj", "model.layers.43.mlp.experts.119.down_proj", "model.layers.43.mlp.experts.120.down_proj", "model.layers.43.mlp.experts.121.down_proj", "model.layers.43.mlp.experts.122.down_proj", "model.layers.43.mlp.experts.123.down_proj", "model.layers.43.mlp.experts.124.down_proj", "model.layers.43.mlp.experts.125.down_proj", "model.layers.43.mlp.experts.126.down_proj", "model.layers.43.mlp.experts.127.down_proj", "model.layers.43.mlp.experts.128.down_proj", "model.layers.43.mlp.experts.129.down_proj", "model.layers.43.mlp.experts.130.down_proj", "model.layers.43.mlp.experts.131.down_proj", "model.layers.43.mlp.experts.132.down_proj", "model.layers.43.mlp.experts.133.down_proj", "model.layers.43.mlp.experts.134.down_proj", "model.layers.43.mlp.experts.135.down_proj", "model.layers.43.mlp.experts.136.down_proj", "model.layers.43.mlp.experts.137.down_proj", "model.layers.43.mlp.experts.138.down_proj", "model.layers.43.mlp.experts.139.down_proj", "model.layers.43.mlp.experts.140.down_proj", "model.layers.43.mlp.experts.141.down_proj", "model.layers.43.mlp.experts.142.down_proj", "model.layers.43.mlp.experts.143.down_proj", "model.layers.43.mlp.experts.144.down_proj", "model.layers.43.mlp.experts.145.down_proj", "model.layers.43.mlp.experts.146.down_proj", "model.layers.43.mlp.experts.147.down_proj", "model.layers.43.mlp.experts.148.down_proj", "model.layers.43.mlp.experts.149.down_proj", "model.layers.43.mlp.experts.150.down_proj", "model.layers.43.mlp.experts.151.down_proj", "model.layers.43.mlp.experts.152.down_proj", "model.layers.43.mlp.experts.153.down_proj", "model.layers.43.mlp.experts.154.down_proj", "model.layers.43.mlp.experts.155.down_proj", "model.layers.43.mlp.experts.156.down_proj", "model.layers.43.mlp.experts.157.down_proj", "model.layers.43.mlp.experts.158.down_proj", "model.layers.43.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 9.562727063894619e-06, "dbits": 1258291200 }, { "dkld": 1.412192359566758e-05, "dbits": 2516582400 } ] }, { "idx": 261, "layers": [ "model.layers.44.self_attn.q_proj" ], "candidates": [ { "dkld": 4.407810047270255e-06, "dbits": 62914560 }, { "dkld": -3.173844888806204e-05, "dbits": 125829120 } ] }, { "idx": 262, "layers": [ "model.layers.44.self_attn.k_proj", "model.layers.44.self_attn.v_proj" ], "candidates": [ { "dkld": 8.724131621420418e-05, "dbits": 10485760 }, { "dkld": 0.0001423344481736432, "dbits": 20971520 } ] }, { "idx": 263, "layers": [ "model.layers.44.self_attn.o_proj" ], "candidates": [ { "dkld": -7.953024469315936e-05, "dbits": 62914560 }, { "dkld": -7.812574040144682e-05, "dbits": 125829120 } ] }, { "idx": 264, "layers": [ "model.layers.44.mlp.shared_experts.gate_proj", "model.layers.44.mlp.shared_experts.up_proj", "model.layers.44.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -9.357202798128059e-05, "dbits": 23592960 }, { "dkld": -6.352183409035102e-05, "dbits": 47185920 } ] }, { "idx": 265, "layers": [ "model.layers.44.mlp.experts.0.gate_proj", "model.layers.44.mlp.experts.1.gate_proj", "model.layers.44.mlp.experts.2.gate_proj", "model.layers.44.mlp.experts.3.gate_proj", "model.layers.44.mlp.experts.4.gate_proj", "model.layers.44.mlp.experts.5.gate_proj", "model.layers.44.mlp.experts.6.gate_proj", "model.layers.44.mlp.experts.7.gate_proj", "model.layers.44.mlp.experts.8.gate_proj", "model.layers.44.mlp.experts.9.gate_proj", "model.layers.44.mlp.experts.10.gate_proj", "model.layers.44.mlp.experts.11.gate_proj", "model.layers.44.mlp.experts.12.gate_proj", "model.layers.44.mlp.experts.13.gate_proj", "model.layers.44.mlp.experts.14.gate_proj", "model.layers.44.mlp.experts.15.gate_proj", "model.layers.44.mlp.experts.16.gate_proj", "model.layers.44.mlp.experts.17.gate_proj", "model.layers.44.mlp.experts.18.gate_proj", "model.layers.44.mlp.experts.19.gate_proj", "model.layers.44.mlp.experts.20.gate_proj", "model.layers.44.mlp.experts.21.gate_proj", "model.layers.44.mlp.experts.22.gate_proj", "model.layers.44.mlp.experts.23.gate_proj", "model.layers.44.mlp.experts.24.gate_proj", "model.layers.44.mlp.experts.25.gate_proj", "model.layers.44.mlp.experts.26.gate_proj", "model.layers.44.mlp.experts.27.gate_proj", "model.layers.44.mlp.experts.28.gate_proj", "model.layers.44.mlp.experts.29.gate_proj", "model.layers.44.mlp.experts.30.gate_proj", "model.layers.44.mlp.experts.31.gate_proj", "model.layers.44.mlp.experts.32.gate_proj", "model.layers.44.mlp.experts.33.gate_proj", "model.layers.44.mlp.experts.34.gate_proj", "model.layers.44.mlp.experts.35.gate_proj", "model.layers.44.mlp.experts.36.gate_proj", "model.layers.44.mlp.experts.37.gate_proj", "model.layers.44.mlp.experts.38.gate_proj", "model.layers.44.mlp.experts.39.gate_proj", "model.layers.44.mlp.experts.40.gate_proj", "model.layers.44.mlp.experts.41.gate_proj", "model.layers.44.mlp.experts.42.gate_proj", "model.layers.44.mlp.experts.43.gate_proj", "model.layers.44.mlp.experts.44.gate_proj", "model.layers.44.mlp.experts.45.gate_proj", "model.layers.44.mlp.experts.46.gate_proj", "model.layers.44.mlp.experts.47.gate_proj", "model.layers.44.mlp.experts.48.gate_proj", "model.layers.44.mlp.experts.49.gate_proj", "model.layers.44.mlp.experts.50.gate_proj", "model.layers.44.mlp.experts.51.gate_proj", "model.layers.44.mlp.experts.52.gate_proj", "model.layers.44.mlp.experts.53.gate_proj", "model.layers.44.mlp.experts.54.gate_proj", "model.layers.44.mlp.experts.55.gate_proj", "model.layers.44.mlp.experts.56.gate_proj", "model.layers.44.mlp.experts.57.gate_proj", "model.layers.44.mlp.experts.58.gate_proj", "model.layers.44.mlp.experts.59.gate_proj", "model.layers.44.mlp.experts.60.gate_proj", "model.layers.44.mlp.experts.61.gate_proj", "model.layers.44.mlp.experts.62.gate_proj", "model.layers.44.mlp.experts.63.gate_proj", "model.layers.44.mlp.experts.64.gate_proj", "model.layers.44.mlp.experts.65.gate_proj", "model.layers.44.mlp.experts.66.gate_proj", "model.layers.44.mlp.experts.67.gate_proj", "model.layers.44.mlp.experts.68.gate_proj", "model.layers.44.mlp.experts.69.gate_proj", "model.layers.44.mlp.experts.70.gate_proj", "model.layers.44.mlp.experts.71.gate_proj", "model.layers.44.mlp.experts.72.gate_proj", "model.layers.44.mlp.experts.73.gate_proj", "model.layers.44.mlp.experts.74.gate_proj", "model.layers.44.mlp.experts.75.gate_proj", "model.layers.44.mlp.experts.76.gate_proj", "model.layers.44.mlp.experts.77.gate_proj", "model.layers.44.mlp.experts.78.gate_proj", "model.layers.44.mlp.experts.79.gate_proj", "model.layers.44.mlp.experts.80.gate_proj", "model.layers.44.mlp.experts.81.gate_proj", "model.layers.44.mlp.experts.82.gate_proj", "model.layers.44.mlp.experts.83.gate_proj", "model.layers.44.mlp.experts.84.gate_proj", "model.layers.44.mlp.experts.85.gate_proj", "model.layers.44.mlp.experts.86.gate_proj", "model.layers.44.mlp.experts.87.gate_proj", "model.layers.44.mlp.experts.88.gate_proj", "model.layers.44.mlp.experts.89.gate_proj", "model.layers.44.mlp.experts.90.gate_proj", "model.layers.44.mlp.experts.91.gate_proj", "model.layers.44.mlp.experts.92.gate_proj", "model.layers.44.mlp.experts.93.gate_proj", "model.layers.44.mlp.experts.94.gate_proj", "model.layers.44.mlp.experts.95.gate_proj", "model.layers.44.mlp.experts.96.gate_proj", "model.layers.44.mlp.experts.97.gate_proj", "model.layers.44.mlp.experts.98.gate_proj", "model.layers.44.mlp.experts.99.gate_proj", "model.layers.44.mlp.experts.100.gate_proj", "model.layers.44.mlp.experts.101.gate_proj", "model.layers.44.mlp.experts.102.gate_proj", "model.layers.44.mlp.experts.103.gate_proj", "model.layers.44.mlp.experts.104.gate_proj", "model.layers.44.mlp.experts.105.gate_proj", "model.layers.44.mlp.experts.106.gate_proj", "model.layers.44.mlp.experts.107.gate_proj", "model.layers.44.mlp.experts.108.gate_proj", "model.layers.44.mlp.experts.109.gate_proj", "model.layers.44.mlp.experts.110.gate_proj", "model.layers.44.mlp.experts.111.gate_proj", "model.layers.44.mlp.experts.112.gate_proj", "model.layers.44.mlp.experts.113.gate_proj", "model.layers.44.mlp.experts.114.gate_proj", "model.layers.44.mlp.experts.115.gate_proj", "model.layers.44.mlp.experts.116.gate_proj", "model.layers.44.mlp.experts.117.gate_proj", "model.layers.44.mlp.experts.118.gate_proj", "model.layers.44.mlp.experts.119.gate_proj", "model.layers.44.mlp.experts.120.gate_proj", "model.layers.44.mlp.experts.121.gate_proj", "model.layers.44.mlp.experts.122.gate_proj", "model.layers.44.mlp.experts.123.gate_proj", "model.layers.44.mlp.experts.124.gate_proj", "model.layers.44.mlp.experts.125.gate_proj", "model.layers.44.mlp.experts.126.gate_proj", "model.layers.44.mlp.experts.127.gate_proj", "model.layers.44.mlp.experts.128.gate_proj", "model.layers.44.mlp.experts.129.gate_proj", "model.layers.44.mlp.experts.130.gate_proj", "model.layers.44.mlp.experts.131.gate_proj", "model.layers.44.mlp.experts.132.gate_proj", "model.layers.44.mlp.experts.133.gate_proj", "model.layers.44.mlp.experts.134.gate_proj", "model.layers.44.mlp.experts.135.gate_proj", "model.layers.44.mlp.experts.136.gate_proj", "model.layers.44.mlp.experts.137.gate_proj", "model.layers.44.mlp.experts.138.gate_proj", "model.layers.44.mlp.experts.139.gate_proj", "model.layers.44.mlp.experts.140.gate_proj", "model.layers.44.mlp.experts.141.gate_proj", "model.layers.44.mlp.experts.142.gate_proj", "model.layers.44.mlp.experts.143.gate_proj", "model.layers.44.mlp.experts.144.gate_proj", "model.layers.44.mlp.experts.145.gate_proj", "model.layers.44.mlp.experts.146.gate_proj", "model.layers.44.mlp.experts.147.gate_proj", "model.layers.44.mlp.experts.148.gate_proj", "model.layers.44.mlp.experts.149.gate_proj", "model.layers.44.mlp.experts.150.gate_proj", "model.layers.44.mlp.experts.151.gate_proj", "model.layers.44.mlp.experts.152.gate_proj", "model.layers.44.mlp.experts.153.gate_proj", "model.layers.44.mlp.experts.154.gate_proj", "model.layers.44.mlp.experts.155.gate_proj", "model.layers.44.mlp.experts.156.gate_proj", "model.layers.44.mlp.experts.157.gate_proj", "model.layers.44.mlp.experts.158.gate_proj", "model.layers.44.mlp.experts.159.gate_proj", "model.layers.44.mlp.experts.0.up_proj", "model.layers.44.mlp.experts.1.up_proj", "model.layers.44.mlp.experts.2.up_proj", "model.layers.44.mlp.experts.3.up_proj", "model.layers.44.mlp.experts.4.up_proj", "model.layers.44.mlp.experts.5.up_proj", "model.layers.44.mlp.experts.6.up_proj", "model.layers.44.mlp.experts.7.up_proj", "model.layers.44.mlp.experts.8.up_proj", "model.layers.44.mlp.experts.9.up_proj", "model.layers.44.mlp.experts.10.up_proj", "model.layers.44.mlp.experts.11.up_proj", "model.layers.44.mlp.experts.12.up_proj", "model.layers.44.mlp.experts.13.up_proj", "model.layers.44.mlp.experts.14.up_proj", "model.layers.44.mlp.experts.15.up_proj", "model.layers.44.mlp.experts.16.up_proj", "model.layers.44.mlp.experts.17.up_proj", "model.layers.44.mlp.experts.18.up_proj", "model.layers.44.mlp.experts.19.up_proj", "model.layers.44.mlp.experts.20.up_proj", "model.layers.44.mlp.experts.21.up_proj", "model.layers.44.mlp.experts.22.up_proj", "model.layers.44.mlp.experts.23.up_proj", "model.layers.44.mlp.experts.24.up_proj", "model.layers.44.mlp.experts.25.up_proj", "model.layers.44.mlp.experts.26.up_proj", "model.layers.44.mlp.experts.27.up_proj", "model.layers.44.mlp.experts.28.up_proj", "model.layers.44.mlp.experts.29.up_proj", "model.layers.44.mlp.experts.30.up_proj", "model.layers.44.mlp.experts.31.up_proj", "model.layers.44.mlp.experts.32.up_proj", "model.layers.44.mlp.experts.33.up_proj", "model.layers.44.mlp.experts.34.up_proj", "model.layers.44.mlp.experts.35.up_proj", "model.layers.44.mlp.experts.36.up_proj", "model.layers.44.mlp.experts.37.up_proj", "model.layers.44.mlp.experts.38.up_proj", "model.layers.44.mlp.experts.39.up_proj", "model.layers.44.mlp.experts.40.up_proj", "model.layers.44.mlp.experts.41.up_proj", "model.layers.44.mlp.experts.42.up_proj", "model.layers.44.mlp.experts.43.up_proj", "model.layers.44.mlp.experts.44.up_proj", "model.layers.44.mlp.experts.45.up_proj", "model.layers.44.mlp.experts.46.up_proj", "model.layers.44.mlp.experts.47.up_proj", "model.layers.44.mlp.experts.48.up_proj", "model.layers.44.mlp.experts.49.up_proj", "model.layers.44.mlp.experts.50.up_proj", "model.layers.44.mlp.experts.51.up_proj", "model.layers.44.mlp.experts.52.up_proj", "model.layers.44.mlp.experts.53.up_proj", "model.layers.44.mlp.experts.54.up_proj", "model.layers.44.mlp.experts.55.up_proj", "model.layers.44.mlp.experts.56.up_proj", "model.layers.44.mlp.experts.57.up_proj", "model.layers.44.mlp.experts.58.up_proj", "model.layers.44.mlp.experts.59.up_proj", "model.layers.44.mlp.experts.60.up_proj", "model.layers.44.mlp.experts.61.up_proj", "model.layers.44.mlp.experts.62.up_proj", "model.layers.44.mlp.experts.63.up_proj", "model.layers.44.mlp.experts.64.up_proj", "model.layers.44.mlp.experts.65.up_proj", "model.layers.44.mlp.experts.66.up_proj", "model.layers.44.mlp.experts.67.up_proj", "model.layers.44.mlp.experts.68.up_proj", "model.layers.44.mlp.experts.69.up_proj", "model.layers.44.mlp.experts.70.up_proj", "model.layers.44.mlp.experts.71.up_proj", "model.layers.44.mlp.experts.72.up_proj", "model.layers.44.mlp.experts.73.up_proj", "model.layers.44.mlp.experts.74.up_proj", "model.layers.44.mlp.experts.75.up_proj", "model.layers.44.mlp.experts.76.up_proj", "model.layers.44.mlp.experts.77.up_proj", "model.layers.44.mlp.experts.78.up_proj", "model.layers.44.mlp.experts.79.up_proj", "model.layers.44.mlp.experts.80.up_proj", "model.layers.44.mlp.experts.81.up_proj", "model.layers.44.mlp.experts.82.up_proj", "model.layers.44.mlp.experts.83.up_proj", "model.layers.44.mlp.experts.84.up_proj", "model.layers.44.mlp.experts.85.up_proj", "model.layers.44.mlp.experts.86.up_proj", "model.layers.44.mlp.experts.87.up_proj", "model.layers.44.mlp.experts.88.up_proj", "model.layers.44.mlp.experts.89.up_proj", "model.layers.44.mlp.experts.90.up_proj", "model.layers.44.mlp.experts.91.up_proj", "model.layers.44.mlp.experts.92.up_proj", "model.layers.44.mlp.experts.93.up_proj", "model.layers.44.mlp.experts.94.up_proj", "model.layers.44.mlp.experts.95.up_proj", "model.layers.44.mlp.experts.96.up_proj", "model.layers.44.mlp.experts.97.up_proj", "model.layers.44.mlp.experts.98.up_proj", "model.layers.44.mlp.experts.99.up_proj", "model.layers.44.mlp.experts.100.up_proj", "model.layers.44.mlp.experts.101.up_proj", "model.layers.44.mlp.experts.102.up_proj", "model.layers.44.mlp.experts.103.up_proj", "model.layers.44.mlp.experts.104.up_proj", "model.layers.44.mlp.experts.105.up_proj", "model.layers.44.mlp.experts.106.up_proj", "model.layers.44.mlp.experts.107.up_proj", "model.layers.44.mlp.experts.108.up_proj", "model.layers.44.mlp.experts.109.up_proj", "model.layers.44.mlp.experts.110.up_proj", "model.layers.44.mlp.experts.111.up_proj", "model.layers.44.mlp.experts.112.up_proj", "model.layers.44.mlp.experts.113.up_proj", "model.layers.44.mlp.experts.114.up_proj", "model.layers.44.mlp.experts.115.up_proj", "model.layers.44.mlp.experts.116.up_proj", "model.layers.44.mlp.experts.117.up_proj", "model.layers.44.mlp.experts.118.up_proj", "model.layers.44.mlp.experts.119.up_proj", "model.layers.44.mlp.experts.120.up_proj", "model.layers.44.mlp.experts.121.up_proj", "model.layers.44.mlp.experts.122.up_proj", "model.layers.44.mlp.experts.123.up_proj", "model.layers.44.mlp.experts.124.up_proj", "model.layers.44.mlp.experts.125.up_proj", "model.layers.44.mlp.experts.126.up_proj", "model.layers.44.mlp.experts.127.up_proj", "model.layers.44.mlp.experts.128.up_proj", "model.layers.44.mlp.experts.129.up_proj", "model.layers.44.mlp.experts.130.up_proj", "model.layers.44.mlp.experts.131.up_proj", "model.layers.44.mlp.experts.132.up_proj", "model.layers.44.mlp.experts.133.up_proj", "model.layers.44.mlp.experts.134.up_proj", "model.layers.44.mlp.experts.135.up_proj", "model.layers.44.mlp.experts.136.up_proj", "model.layers.44.mlp.experts.137.up_proj", "model.layers.44.mlp.experts.138.up_proj", "model.layers.44.mlp.experts.139.up_proj", "model.layers.44.mlp.experts.140.up_proj", "model.layers.44.mlp.experts.141.up_proj", "model.layers.44.mlp.experts.142.up_proj", "model.layers.44.mlp.experts.143.up_proj", "model.layers.44.mlp.experts.144.up_proj", "model.layers.44.mlp.experts.145.up_proj", "model.layers.44.mlp.experts.146.up_proj", "model.layers.44.mlp.experts.147.up_proj", "model.layers.44.mlp.experts.148.up_proj", "model.layers.44.mlp.experts.149.up_proj", "model.layers.44.mlp.experts.150.up_proj", "model.layers.44.mlp.experts.151.up_proj", "model.layers.44.mlp.experts.152.up_proj", "model.layers.44.mlp.experts.153.up_proj", "model.layers.44.mlp.experts.154.up_proj", "model.layers.44.mlp.experts.155.up_proj", "model.layers.44.mlp.experts.156.up_proj", "model.layers.44.mlp.experts.157.up_proj", "model.layers.44.mlp.experts.158.up_proj", "model.layers.44.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.0240590199828148e-05, "dbits": 2516582400 }, { "dkld": -1.0459031909703168e-05, "dbits": 5033164800 } ] }, { "idx": 266, "layers": [ "model.layers.44.mlp.experts.0.down_proj", "model.layers.44.mlp.experts.1.down_proj", "model.layers.44.mlp.experts.2.down_proj", "model.layers.44.mlp.experts.3.down_proj", "model.layers.44.mlp.experts.4.down_proj", "model.layers.44.mlp.experts.5.down_proj", "model.layers.44.mlp.experts.6.down_proj", "model.layers.44.mlp.experts.7.down_proj", "model.layers.44.mlp.experts.8.down_proj", "model.layers.44.mlp.experts.9.down_proj", "model.layers.44.mlp.experts.10.down_proj", "model.layers.44.mlp.experts.11.down_proj", "model.layers.44.mlp.experts.12.down_proj", "model.layers.44.mlp.experts.13.down_proj", "model.layers.44.mlp.experts.14.down_proj", "model.layers.44.mlp.experts.15.down_proj", "model.layers.44.mlp.experts.16.down_proj", "model.layers.44.mlp.experts.17.down_proj", "model.layers.44.mlp.experts.18.down_proj", "model.layers.44.mlp.experts.19.down_proj", "model.layers.44.mlp.experts.20.down_proj", "model.layers.44.mlp.experts.21.down_proj", "model.layers.44.mlp.experts.22.down_proj", "model.layers.44.mlp.experts.23.down_proj", "model.layers.44.mlp.experts.24.down_proj", "model.layers.44.mlp.experts.25.down_proj", "model.layers.44.mlp.experts.26.down_proj", "model.layers.44.mlp.experts.27.down_proj", "model.layers.44.mlp.experts.28.down_proj", "model.layers.44.mlp.experts.29.down_proj", "model.layers.44.mlp.experts.30.down_proj", "model.layers.44.mlp.experts.31.down_proj", "model.layers.44.mlp.experts.32.down_proj", "model.layers.44.mlp.experts.33.down_proj", "model.layers.44.mlp.experts.34.down_proj", "model.layers.44.mlp.experts.35.down_proj", "model.layers.44.mlp.experts.36.down_proj", "model.layers.44.mlp.experts.37.down_proj", "model.layers.44.mlp.experts.38.down_proj", "model.layers.44.mlp.experts.39.down_proj", "model.layers.44.mlp.experts.40.down_proj", "model.layers.44.mlp.experts.41.down_proj", "model.layers.44.mlp.experts.42.down_proj", "model.layers.44.mlp.experts.43.down_proj", "model.layers.44.mlp.experts.44.down_proj", "model.layers.44.mlp.experts.45.down_proj", "model.layers.44.mlp.experts.46.down_proj", "model.layers.44.mlp.experts.47.down_proj", "model.layers.44.mlp.experts.48.down_proj", "model.layers.44.mlp.experts.49.down_proj", "model.layers.44.mlp.experts.50.down_proj", "model.layers.44.mlp.experts.51.down_proj", "model.layers.44.mlp.experts.52.down_proj", "model.layers.44.mlp.experts.53.down_proj", "model.layers.44.mlp.experts.54.down_proj", "model.layers.44.mlp.experts.55.down_proj", "model.layers.44.mlp.experts.56.down_proj", "model.layers.44.mlp.experts.57.down_proj", "model.layers.44.mlp.experts.58.down_proj", "model.layers.44.mlp.experts.59.down_proj", "model.layers.44.mlp.experts.60.down_proj", "model.layers.44.mlp.experts.61.down_proj", "model.layers.44.mlp.experts.62.down_proj", "model.layers.44.mlp.experts.63.down_proj", "model.layers.44.mlp.experts.64.down_proj", "model.layers.44.mlp.experts.65.down_proj", "model.layers.44.mlp.experts.66.down_proj", "model.layers.44.mlp.experts.67.down_proj", "model.layers.44.mlp.experts.68.down_proj", "model.layers.44.mlp.experts.69.down_proj", "model.layers.44.mlp.experts.70.down_proj", "model.layers.44.mlp.experts.71.down_proj", "model.layers.44.mlp.experts.72.down_proj", "model.layers.44.mlp.experts.73.down_proj", "model.layers.44.mlp.experts.74.down_proj", "model.layers.44.mlp.experts.75.down_proj", "model.layers.44.mlp.experts.76.down_proj", "model.layers.44.mlp.experts.77.down_proj", "model.layers.44.mlp.experts.78.down_proj", "model.layers.44.mlp.experts.79.down_proj", "model.layers.44.mlp.experts.80.down_proj", "model.layers.44.mlp.experts.81.down_proj", "model.layers.44.mlp.experts.82.down_proj", "model.layers.44.mlp.experts.83.down_proj", "model.layers.44.mlp.experts.84.down_proj", "model.layers.44.mlp.experts.85.down_proj", "model.layers.44.mlp.experts.86.down_proj", "model.layers.44.mlp.experts.87.down_proj", "model.layers.44.mlp.experts.88.down_proj", "model.layers.44.mlp.experts.89.down_proj", "model.layers.44.mlp.experts.90.down_proj", "model.layers.44.mlp.experts.91.down_proj", "model.layers.44.mlp.experts.92.down_proj", "model.layers.44.mlp.experts.93.down_proj", "model.layers.44.mlp.experts.94.down_proj", "model.layers.44.mlp.experts.95.down_proj", "model.layers.44.mlp.experts.96.down_proj", "model.layers.44.mlp.experts.97.down_proj", "model.layers.44.mlp.experts.98.down_proj", "model.layers.44.mlp.experts.99.down_proj", "model.layers.44.mlp.experts.100.down_proj", "model.layers.44.mlp.experts.101.down_proj", "model.layers.44.mlp.experts.102.down_proj", "model.layers.44.mlp.experts.103.down_proj", "model.layers.44.mlp.experts.104.down_proj", "model.layers.44.mlp.experts.105.down_proj", "model.layers.44.mlp.experts.106.down_proj", "model.layers.44.mlp.experts.107.down_proj", "model.layers.44.mlp.experts.108.down_proj", "model.layers.44.mlp.experts.109.down_proj", "model.layers.44.mlp.experts.110.down_proj", "model.layers.44.mlp.experts.111.down_proj", "model.layers.44.mlp.experts.112.down_proj", "model.layers.44.mlp.experts.113.down_proj", "model.layers.44.mlp.experts.114.down_proj", "model.layers.44.mlp.experts.115.down_proj", "model.layers.44.mlp.experts.116.down_proj", "model.layers.44.mlp.experts.117.down_proj", "model.layers.44.mlp.experts.118.down_proj", "model.layers.44.mlp.experts.119.down_proj", "model.layers.44.mlp.experts.120.down_proj", "model.layers.44.mlp.experts.121.down_proj", "model.layers.44.mlp.experts.122.down_proj", "model.layers.44.mlp.experts.123.down_proj", "model.layers.44.mlp.experts.124.down_proj", "model.layers.44.mlp.experts.125.down_proj", "model.layers.44.mlp.experts.126.down_proj", "model.layers.44.mlp.experts.127.down_proj", "model.layers.44.mlp.experts.128.down_proj", "model.layers.44.mlp.experts.129.down_proj", "model.layers.44.mlp.experts.130.down_proj", "model.layers.44.mlp.experts.131.down_proj", "model.layers.44.mlp.experts.132.down_proj", "model.layers.44.mlp.experts.133.down_proj", "model.layers.44.mlp.experts.134.down_proj", "model.layers.44.mlp.experts.135.down_proj", "model.layers.44.mlp.experts.136.down_proj", "model.layers.44.mlp.experts.137.down_proj", "model.layers.44.mlp.experts.138.down_proj", "model.layers.44.mlp.experts.139.down_proj", "model.layers.44.mlp.experts.140.down_proj", "model.layers.44.mlp.experts.141.down_proj", "model.layers.44.mlp.experts.142.down_proj", "model.layers.44.mlp.experts.143.down_proj", "model.layers.44.mlp.experts.144.down_proj", "model.layers.44.mlp.experts.145.down_proj", "model.layers.44.mlp.experts.146.down_proj", "model.layers.44.mlp.experts.147.down_proj", "model.layers.44.mlp.experts.148.down_proj", "model.layers.44.mlp.experts.149.down_proj", "model.layers.44.mlp.experts.150.down_proj", "model.layers.44.mlp.experts.151.down_proj", "model.layers.44.mlp.experts.152.down_proj", "model.layers.44.mlp.experts.153.down_proj", "model.layers.44.mlp.experts.154.down_proj", "model.layers.44.mlp.experts.155.down_proj", "model.layers.44.mlp.experts.156.down_proj", "model.layers.44.mlp.experts.157.down_proj", "model.layers.44.mlp.experts.158.down_proj", "model.layers.44.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 1.9704923033721233e-06, "dbits": 1258291200 }, { "dkld": -8.954922668634457e-06, "dbits": 2516582400 } ] }, { "idx": 267, "layers": [ "model.layers.45.self_attn.q_proj" ], "candidates": [ { "dkld": 5.0686532631516457e-05, "dbits": 62914560 }, { "dkld": 4.653367213904892e-05, "dbits": 125829120 } ] }, { "idx": 268, "layers": [ "model.layers.45.self_attn.k_proj", "model.layers.45.self_attn.v_proj" ], "candidates": [ { "dkld": -6.46540429443121e-05, "dbits": 10485760 }, { "dkld": -2.7330592274665833e-05, "dbits": 20971520 } ] }, { "idx": 269, "layers": [ "model.layers.45.self_attn.o_proj" ], "candidates": [ { "dkld": 2.9434636235238162e-05, "dbits": 62914560 }, { "dkld": -1.0699825361370693e-05, "dbits": 125829120 } ] }, { "idx": 270, "layers": [ "model.layers.45.mlp.shared_experts.gate_proj", "model.layers.45.mlp.shared_experts.up_proj", "model.layers.45.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 6.242305971682072e-06, "dbits": 23592960 }, { "dkld": -2.5975424796341462e-05, "dbits": 47185920 } ] }, { "idx": 271, "layers": [ "model.layers.45.mlp.experts.0.gate_proj", "model.layers.45.mlp.experts.1.gate_proj", "model.layers.45.mlp.experts.2.gate_proj", "model.layers.45.mlp.experts.3.gate_proj", "model.layers.45.mlp.experts.4.gate_proj", "model.layers.45.mlp.experts.5.gate_proj", "model.layers.45.mlp.experts.6.gate_proj", "model.layers.45.mlp.experts.7.gate_proj", "model.layers.45.mlp.experts.8.gate_proj", "model.layers.45.mlp.experts.9.gate_proj", "model.layers.45.mlp.experts.10.gate_proj", "model.layers.45.mlp.experts.11.gate_proj", "model.layers.45.mlp.experts.12.gate_proj", "model.layers.45.mlp.experts.13.gate_proj", "model.layers.45.mlp.experts.14.gate_proj", "model.layers.45.mlp.experts.15.gate_proj", "model.layers.45.mlp.experts.16.gate_proj", "model.layers.45.mlp.experts.17.gate_proj", "model.layers.45.mlp.experts.18.gate_proj", "model.layers.45.mlp.experts.19.gate_proj", "model.layers.45.mlp.experts.20.gate_proj", "model.layers.45.mlp.experts.21.gate_proj", "model.layers.45.mlp.experts.22.gate_proj", "model.layers.45.mlp.experts.23.gate_proj", "model.layers.45.mlp.experts.24.gate_proj", "model.layers.45.mlp.experts.25.gate_proj", "model.layers.45.mlp.experts.26.gate_proj", "model.layers.45.mlp.experts.27.gate_proj", "model.layers.45.mlp.experts.28.gate_proj", "model.layers.45.mlp.experts.29.gate_proj", "model.layers.45.mlp.experts.30.gate_proj", "model.layers.45.mlp.experts.31.gate_proj", "model.layers.45.mlp.experts.32.gate_proj", "model.layers.45.mlp.experts.33.gate_proj", "model.layers.45.mlp.experts.34.gate_proj", "model.layers.45.mlp.experts.35.gate_proj", "model.layers.45.mlp.experts.36.gate_proj", "model.layers.45.mlp.experts.37.gate_proj", "model.layers.45.mlp.experts.38.gate_proj", "model.layers.45.mlp.experts.39.gate_proj", "model.layers.45.mlp.experts.40.gate_proj", "model.layers.45.mlp.experts.41.gate_proj", "model.layers.45.mlp.experts.42.gate_proj", "model.layers.45.mlp.experts.43.gate_proj", "model.layers.45.mlp.experts.44.gate_proj", "model.layers.45.mlp.experts.45.gate_proj", "model.layers.45.mlp.experts.46.gate_proj", "model.layers.45.mlp.experts.47.gate_proj", "model.layers.45.mlp.experts.48.gate_proj", "model.layers.45.mlp.experts.49.gate_proj", "model.layers.45.mlp.experts.50.gate_proj", "model.layers.45.mlp.experts.51.gate_proj", "model.layers.45.mlp.experts.52.gate_proj", "model.layers.45.mlp.experts.53.gate_proj", "model.layers.45.mlp.experts.54.gate_proj", "model.layers.45.mlp.experts.55.gate_proj", "model.layers.45.mlp.experts.56.gate_proj", "model.layers.45.mlp.experts.57.gate_proj", "model.layers.45.mlp.experts.58.gate_proj", "model.layers.45.mlp.experts.59.gate_proj", "model.layers.45.mlp.experts.60.gate_proj", "model.layers.45.mlp.experts.61.gate_proj", "model.layers.45.mlp.experts.62.gate_proj", "model.layers.45.mlp.experts.63.gate_proj", "model.layers.45.mlp.experts.64.gate_proj", "model.layers.45.mlp.experts.65.gate_proj", "model.layers.45.mlp.experts.66.gate_proj", "model.layers.45.mlp.experts.67.gate_proj", "model.layers.45.mlp.experts.68.gate_proj", "model.layers.45.mlp.experts.69.gate_proj", "model.layers.45.mlp.experts.70.gate_proj", "model.layers.45.mlp.experts.71.gate_proj", "model.layers.45.mlp.experts.72.gate_proj", "model.layers.45.mlp.experts.73.gate_proj", "model.layers.45.mlp.experts.74.gate_proj", "model.layers.45.mlp.experts.75.gate_proj", "model.layers.45.mlp.experts.76.gate_proj", "model.layers.45.mlp.experts.77.gate_proj", "model.layers.45.mlp.experts.78.gate_proj", "model.layers.45.mlp.experts.79.gate_proj", "model.layers.45.mlp.experts.80.gate_proj", "model.layers.45.mlp.experts.81.gate_proj", "model.layers.45.mlp.experts.82.gate_proj", "model.layers.45.mlp.experts.83.gate_proj", "model.layers.45.mlp.experts.84.gate_proj", "model.layers.45.mlp.experts.85.gate_proj", "model.layers.45.mlp.experts.86.gate_proj", "model.layers.45.mlp.experts.87.gate_proj", "model.layers.45.mlp.experts.88.gate_proj", "model.layers.45.mlp.experts.89.gate_proj", "model.layers.45.mlp.experts.90.gate_proj", "model.layers.45.mlp.experts.91.gate_proj", "model.layers.45.mlp.experts.92.gate_proj", "model.layers.45.mlp.experts.93.gate_proj", "model.layers.45.mlp.experts.94.gate_proj", "model.layers.45.mlp.experts.95.gate_proj", "model.layers.45.mlp.experts.96.gate_proj", "model.layers.45.mlp.experts.97.gate_proj", "model.layers.45.mlp.experts.98.gate_proj", "model.layers.45.mlp.experts.99.gate_proj", "model.layers.45.mlp.experts.100.gate_proj", "model.layers.45.mlp.experts.101.gate_proj", "model.layers.45.mlp.experts.102.gate_proj", "model.layers.45.mlp.experts.103.gate_proj", "model.layers.45.mlp.experts.104.gate_proj", "model.layers.45.mlp.experts.105.gate_proj", "model.layers.45.mlp.experts.106.gate_proj", "model.layers.45.mlp.experts.107.gate_proj", "model.layers.45.mlp.experts.108.gate_proj", "model.layers.45.mlp.experts.109.gate_proj", "model.layers.45.mlp.experts.110.gate_proj", "model.layers.45.mlp.experts.111.gate_proj", "model.layers.45.mlp.experts.112.gate_proj", "model.layers.45.mlp.experts.113.gate_proj", "model.layers.45.mlp.experts.114.gate_proj", "model.layers.45.mlp.experts.115.gate_proj", "model.layers.45.mlp.experts.116.gate_proj", "model.layers.45.mlp.experts.117.gate_proj", "model.layers.45.mlp.experts.118.gate_proj", "model.layers.45.mlp.experts.119.gate_proj", "model.layers.45.mlp.experts.120.gate_proj", "model.layers.45.mlp.experts.121.gate_proj", "model.layers.45.mlp.experts.122.gate_proj", "model.layers.45.mlp.experts.123.gate_proj", "model.layers.45.mlp.experts.124.gate_proj", "model.layers.45.mlp.experts.125.gate_proj", "model.layers.45.mlp.experts.126.gate_proj", "model.layers.45.mlp.experts.127.gate_proj", "model.layers.45.mlp.experts.128.gate_proj", "model.layers.45.mlp.experts.129.gate_proj", "model.layers.45.mlp.experts.130.gate_proj", "model.layers.45.mlp.experts.131.gate_proj", "model.layers.45.mlp.experts.132.gate_proj", "model.layers.45.mlp.experts.133.gate_proj", "model.layers.45.mlp.experts.134.gate_proj", "model.layers.45.mlp.experts.135.gate_proj", "model.layers.45.mlp.experts.136.gate_proj", "model.layers.45.mlp.experts.137.gate_proj", "model.layers.45.mlp.experts.138.gate_proj", "model.layers.45.mlp.experts.139.gate_proj", "model.layers.45.mlp.experts.140.gate_proj", "model.layers.45.mlp.experts.141.gate_proj", "model.layers.45.mlp.experts.142.gate_proj", "model.layers.45.mlp.experts.143.gate_proj", "model.layers.45.mlp.experts.144.gate_proj", "model.layers.45.mlp.experts.145.gate_proj", "model.layers.45.mlp.experts.146.gate_proj", "model.layers.45.mlp.experts.147.gate_proj", "model.layers.45.mlp.experts.148.gate_proj", "model.layers.45.mlp.experts.149.gate_proj", "model.layers.45.mlp.experts.150.gate_proj", "model.layers.45.mlp.experts.151.gate_proj", "model.layers.45.mlp.experts.152.gate_proj", "model.layers.45.mlp.experts.153.gate_proj", "model.layers.45.mlp.experts.154.gate_proj", "model.layers.45.mlp.experts.155.gate_proj", "model.layers.45.mlp.experts.156.gate_proj", "model.layers.45.mlp.experts.157.gate_proj", "model.layers.45.mlp.experts.158.gate_proj", "model.layers.45.mlp.experts.159.gate_proj", "model.layers.45.mlp.experts.0.up_proj", "model.layers.45.mlp.experts.1.up_proj", "model.layers.45.mlp.experts.2.up_proj", "model.layers.45.mlp.experts.3.up_proj", "model.layers.45.mlp.experts.4.up_proj", "model.layers.45.mlp.experts.5.up_proj", "model.layers.45.mlp.experts.6.up_proj", "model.layers.45.mlp.experts.7.up_proj", "model.layers.45.mlp.experts.8.up_proj", "model.layers.45.mlp.experts.9.up_proj", "model.layers.45.mlp.experts.10.up_proj", "model.layers.45.mlp.experts.11.up_proj", "model.layers.45.mlp.experts.12.up_proj", "model.layers.45.mlp.experts.13.up_proj", "model.layers.45.mlp.experts.14.up_proj", "model.layers.45.mlp.experts.15.up_proj", "model.layers.45.mlp.experts.16.up_proj", "model.layers.45.mlp.experts.17.up_proj", "model.layers.45.mlp.experts.18.up_proj", "model.layers.45.mlp.experts.19.up_proj", "model.layers.45.mlp.experts.20.up_proj", "model.layers.45.mlp.experts.21.up_proj", "model.layers.45.mlp.experts.22.up_proj", "model.layers.45.mlp.experts.23.up_proj", "model.layers.45.mlp.experts.24.up_proj", "model.layers.45.mlp.experts.25.up_proj", "model.layers.45.mlp.experts.26.up_proj", "model.layers.45.mlp.experts.27.up_proj", "model.layers.45.mlp.experts.28.up_proj", "model.layers.45.mlp.experts.29.up_proj", "model.layers.45.mlp.experts.30.up_proj", "model.layers.45.mlp.experts.31.up_proj", "model.layers.45.mlp.experts.32.up_proj", "model.layers.45.mlp.experts.33.up_proj", "model.layers.45.mlp.experts.34.up_proj", "model.layers.45.mlp.experts.35.up_proj", "model.layers.45.mlp.experts.36.up_proj", "model.layers.45.mlp.experts.37.up_proj", "model.layers.45.mlp.experts.38.up_proj", "model.layers.45.mlp.experts.39.up_proj", "model.layers.45.mlp.experts.40.up_proj", "model.layers.45.mlp.experts.41.up_proj", "model.layers.45.mlp.experts.42.up_proj", "model.layers.45.mlp.experts.43.up_proj", "model.layers.45.mlp.experts.44.up_proj", "model.layers.45.mlp.experts.45.up_proj", "model.layers.45.mlp.experts.46.up_proj", "model.layers.45.mlp.experts.47.up_proj", "model.layers.45.mlp.experts.48.up_proj", "model.layers.45.mlp.experts.49.up_proj", "model.layers.45.mlp.experts.50.up_proj", "model.layers.45.mlp.experts.51.up_proj", "model.layers.45.mlp.experts.52.up_proj", "model.layers.45.mlp.experts.53.up_proj", "model.layers.45.mlp.experts.54.up_proj", "model.layers.45.mlp.experts.55.up_proj", "model.layers.45.mlp.experts.56.up_proj", "model.layers.45.mlp.experts.57.up_proj", "model.layers.45.mlp.experts.58.up_proj", "model.layers.45.mlp.experts.59.up_proj", "model.layers.45.mlp.experts.60.up_proj", "model.layers.45.mlp.experts.61.up_proj", "model.layers.45.mlp.experts.62.up_proj", "model.layers.45.mlp.experts.63.up_proj", "model.layers.45.mlp.experts.64.up_proj", "model.layers.45.mlp.experts.65.up_proj", "model.layers.45.mlp.experts.66.up_proj", "model.layers.45.mlp.experts.67.up_proj", "model.layers.45.mlp.experts.68.up_proj", "model.layers.45.mlp.experts.69.up_proj", "model.layers.45.mlp.experts.70.up_proj", "model.layers.45.mlp.experts.71.up_proj", "model.layers.45.mlp.experts.72.up_proj", "model.layers.45.mlp.experts.73.up_proj", "model.layers.45.mlp.experts.74.up_proj", "model.layers.45.mlp.experts.75.up_proj", "model.layers.45.mlp.experts.76.up_proj", "model.layers.45.mlp.experts.77.up_proj", "model.layers.45.mlp.experts.78.up_proj", "model.layers.45.mlp.experts.79.up_proj", "model.layers.45.mlp.experts.80.up_proj", "model.layers.45.mlp.experts.81.up_proj", "model.layers.45.mlp.experts.82.up_proj", "model.layers.45.mlp.experts.83.up_proj", "model.layers.45.mlp.experts.84.up_proj", "model.layers.45.mlp.experts.85.up_proj", "model.layers.45.mlp.experts.86.up_proj", "model.layers.45.mlp.experts.87.up_proj", "model.layers.45.mlp.experts.88.up_proj", "model.layers.45.mlp.experts.89.up_proj", "model.layers.45.mlp.experts.90.up_proj", "model.layers.45.mlp.experts.91.up_proj", "model.layers.45.mlp.experts.92.up_proj", "model.layers.45.mlp.experts.93.up_proj", "model.layers.45.mlp.experts.94.up_proj", "model.layers.45.mlp.experts.95.up_proj", "model.layers.45.mlp.experts.96.up_proj", "model.layers.45.mlp.experts.97.up_proj", "model.layers.45.mlp.experts.98.up_proj", "model.layers.45.mlp.experts.99.up_proj", "model.layers.45.mlp.experts.100.up_proj", "model.layers.45.mlp.experts.101.up_proj", "model.layers.45.mlp.experts.102.up_proj", "model.layers.45.mlp.experts.103.up_proj", "model.layers.45.mlp.experts.104.up_proj", "model.layers.45.mlp.experts.105.up_proj", "model.layers.45.mlp.experts.106.up_proj", "model.layers.45.mlp.experts.107.up_proj", "model.layers.45.mlp.experts.108.up_proj", "model.layers.45.mlp.experts.109.up_proj", "model.layers.45.mlp.experts.110.up_proj", "model.layers.45.mlp.experts.111.up_proj", "model.layers.45.mlp.experts.112.up_proj", "model.layers.45.mlp.experts.113.up_proj", "model.layers.45.mlp.experts.114.up_proj", "model.layers.45.mlp.experts.115.up_proj", "model.layers.45.mlp.experts.116.up_proj", "model.layers.45.mlp.experts.117.up_proj", "model.layers.45.mlp.experts.118.up_proj", "model.layers.45.mlp.experts.119.up_proj", "model.layers.45.mlp.experts.120.up_proj", "model.layers.45.mlp.experts.121.up_proj", "model.layers.45.mlp.experts.122.up_proj", "model.layers.45.mlp.experts.123.up_proj", "model.layers.45.mlp.experts.124.up_proj", "model.layers.45.mlp.experts.125.up_proj", "model.layers.45.mlp.experts.126.up_proj", "model.layers.45.mlp.experts.127.up_proj", "model.layers.45.mlp.experts.128.up_proj", "model.layers.45.mlp.experts.129.up_proj", "model.layers.45.mlp.experts.130.up_proj", "model.layers.45.mlp.experts.131.up_proj", "model.layers.45.mlp.experts.132.up_proj", "model.layers.45.mlp.experts.133.up_proj", "model.layers.45.mlp.experts.134.up_proj", "model.layers.45.mlp.experts.135.up_proj", "model.layers.45.mlp.experts.136.up_proj", "model.layers.45.mlp.experts.137.up_proj", "model.layers.45.mlp.experts.138.up_proj", "model.layers.45.mlp.experts.139.up_proj", "model.layers.45.mlp.experts.140.up_proj", "model.layers.45.mlp.experts.141.up_proj", "model.layers.45.mlp.experts.142.up_proj", "model.layers.45.mlp.experts.143.up_proj", "model.layers.45.mlp.experts.144.up_proj", "model.layers.45.mlp.experts.145.up_proj", "model.layers.45.mlp.experts.146.up_proj", "model.layers.45.mlp.experts.147.up_proj", "model.layers.45.mlp.experts.148.up_proj", "model.layers.45.mlp.experts.149.up_proj", "model.layers.45.mlp.experts.150.up_proj", "model.layers.45.mlp.experts.151.up_proj", "model.layers.45.mlp.experts.152.up_proj", "model.layers.45.mlp.experts.153.up_proj", "model.layers.45.mlp.experts.154.up_proj", "model.layers.45.mlp.experts.155.up_proj", "model.layers.45.mlp.experts.156.up_proj", "model.layers.45.mlp.experts.157.up_proj", "model.layers.45.mlp.experts.158.up_proj", "model.layers.45.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.931823790073464e-05, "dbits": 2516582400 }, { "dkld": 6.377953104675163e-06, "dbits": 5033164800 } ] }, { "idx": 272, "layers": [ "model.layers.45.mlp.experts.0.down_proj", "model.layers.45.mlp.experts.1.down_proj", "model.layers.45.mlp.experts.2.down_proj", "model.layers.45.mlp.experts.3.down_proj", "model.layers.45.mlp.experts.4.down_proj", "model.layers.45.mlp.experts.5.down_proj", "model.layers.45.mlp.experts.6.down_proj", "model.layers.45.mlp.experts.7.down_proj", "model.layers.45.mlp.experts.8.down_proj", "model.layers.45.mlp.experts.9.down_proj", "model.layers.45.mlp.experts.10.down_proj", "model.layers.45.mlp.experts.11.down_proj", "model.layers.45.mlp.experts.12.down_proj", "model.layers.45.mlp.experts.13.down_proj", "model.layers.45.mlp.experts.14.down_proj", "model.layers.45.mlp.experts.15.down_proj", "model.layers.45.mlp.experts.16.down_proj", "model.layers.45.mlp.experts.17.down_proj", "model.layers.45.mlp.experts.18.down_proj", "model.layers.45.mlp.experts.19.down_proj", "model.layers.45.mlp.experts.20.down_proj", "model.layers.45.mlp.experts.21.down_proj", "model.layers.45.mlp.experts.22.down_proj", "model.layers.45.mlp.experts.23.down_proj", "model.layers.45.mlp.experts.24.down_proj", "model.layers.45.mlp.experts.25.down_proj", "model.layers.45.mlp.experts.26.down_proj", "model.layers.45.mlp.experts.27.down_proj", "model.layers.45.mlp.experts.28.down_proj", "model.layers.45.mlp.experts.29.down_proj", "model.layers.45.mlp.experts.30.down_proj", "model.layers.45.mlp.experts.31.down_proj", "model.layers.45.mlp.experts.32.down_proj", "model.layers.45.mlp.experts.33.down_proj", "model.layers.45.mlp.experts.34.down_proj", "model.layers.45.mlp.experts.35.down_proj", "model.layers.45.mlp.experts.36.down_proj", "model.layers.45.mlp.experts.37.down_proj", "model.layers.45.mlp.experts.38.down_proj", "model.layers.45.mlp.experts.39.down_proj", "model.layers.45.mlp.experts.40.down_proj", "model.layers.45.mlp.experts.41.down_proj", "model.layers.45.mlp.experts.42.down_proj", "model.layers.45.mlp.experts.43.down_proj", "model.layers.45.mlp.experts.44.down_proj", "model.layers.45.mlp.experts.45.down_proj", "model.layers.45.mlp.experts.46.down_proj", "model.layers.45.mlp.experts.47.down_proj", "model.layers.45.mlp.experts.48.down_proj", "model.layers.45.mlp.experts.49.down_proj", "model.layers.45.mlp.experts.50.down_proj", "model.layers.45.mlp.experts.51.down_proj", "model.layers.45.mlp.experts.52.down_proj", "model.layers.45.mlp.experts.53.down_proj", "model.layers.45.mlp.experts.54.down_proj", "model.layers.45.mlp.experts.55.down_proj", "model.layers.45.mlp.experts.56.down_proj", "model.layers.45.mlp.experts.57.down_proj", "model.layers.45.mlp.experts.58.down_proj", "model.layers.45.mlp.experts.59.down_proj", "model.layers.45.mlp.experts.60.down_proj", "model.layers.45.mlp.experts.61.down_proj", "model.layers.45.mlp.experts.62.down_proj", "model.layers.45.mlp.experts.63.down_proj", "model.layers.45.mlp.experts.64.down_proj", "model.layers.45.mlp.experts.65.down_proj", "model.layers.45.mlp.experts.66.down_proj", "model.layers.45.mlp.experts.67.down_proj", "model.layers.45.mlp.experts.68.down_proj", "model.layers.45.mlp.experts.69.down_proj", "model.layers.45.mlp.experts.70.down_proj", "model.layers.45.mlp.experts.71.down_proj", "model.layers.45.mlp.experts.72.down_proj", "model.layers.45.mlp.experts.73.down_proj", "model.layers.45.mlp.experts.74.down_proj", "model.layers.45.mlp.experts.75.down_proj", "model.layers.45.mlp.experts.76.down_proj", "model.layers.45.mlp.experts.77.down_proj", "model.layers.45.mlp.experts.78.down_proj", "model.layers.45.mlp.experts.79.down_proj", "model.layers.45.mlp.experts.80.down_proj", "model.layers.45.mlp.experts.81.down_proj", "model.layers.45.mlp.experts.82.down_proj", "model.layers.45.mlp.experts.83.down_proj", "model.layers.45.mlp.experts.84.down_proj", "model.layers.45.mlp.experts.85.down_proj", "model.layers.45.mlp.experts.86.down_proj", "model.layers.45.mlp.experts.87.down_proj", "model.layers.45.mlp.experts.88.down_proj", "model.layers.45.mlp.experts.89.down_proj", "model.layers.45.mlp.experts.90.down_proj", "model.layers.45.mlp.experts.91.down_proj", "model.layers.45.mlp.experts.92.down_proj", "model.layers.45.mlp.experts.93.down_proj", "model.layers.45.mlp.experts.94.down_proj", "model.layers.45.mlp.experts.95.down_proj", "model.layers.45.mlp.experts.96.down_proj", "model.layers.45.mlp.experts.97.down_proj", "model.layers.45.mlp.experts.98.down_proj", "model.layers.45.mlp.experts.99.down_proj", "model.layers.45.mlp.experts.100.down_proj", "model.layers.45.mlp.experts.101.down_proj", "model.layers.45.mlp.experts.102.down_proj", "model.layers.45.mlp.experts.103.down_proj", "model.layers.45.mlp.experts.104.down_proj", "model.layers.45.mlp.experts.105.down_proj", "model.layers.45.mlp.experts.106.down_proj", "model.layers.45.mlp.experts.107.down_proj", "model.layers.45.mlp.experts.108.down_proj", "model.layers.45.mlp.experts.109.down_proj", "model.layers.45.mlp.experts.110.down_proj", "model.layers.45.mlp.experts.111.down_proj", "model.layers.45.mlp.experts.112.down_proj", "model.layers.45.mlp.experts.113.down_proj", "model.layers.45.mlp.experts.114.down_proj", "model.layers.45.mlp.experts.115.down_proj", "model.layers.45.mlp.experts.116.down_proj", "model.layers.45.mlp.experts.117.down_proj", "model.layers.45.mlp.experts.118.down_proj", "model.layers.45.mlp.experts.119.down_proj", "model.layers.45.mlp.experts.120.down_proj", "model.layers.45.mlp.experts.121.down_proj", "model.layers.45.mlp.experts.122.down_proj", "model.layers.45.mlp.experts.123.down_proj", "model.layers.45.mlp.experts.124.down_proj", "model.layers.45.mlp.experts.125.down_proj", "model.layers.45.mlp.experts.126.down_proj", "model.layers.45.mlp.experts.127.down_proj", "model.layers.45.mlp.experts.128.down_proj", "model.layers.45.mlp.experts.129.down_proj", "model.layers.45.mlp.experts.130.down_proj", "model.layers.45.mlp.experts.131.down_proj", "model.layers.45.mlp.experts.132.down_proj", "model.layers.45.mlp.experts.133.down_proj", "model.layers.45.mlp.experts.134.down_proj", "model.layers.45.mlp.experts.135.down_proj", "model.layers.45.mlp.experts.136.down_proj", "model.layers.45.mlp.experts.137.down_proj", "model.layers.45.mlp.experts.138.down_proj", "model.layers.45.mlp.experts.139.down_proj", "model.layers.45.mlp.experts.140.down_proj", "model.layers.45.mlp.experts.141.down_proj", "model.layers.45.mlp.experts.142.down_proj", "model.layers.45.mlp.experts.143.down_proj", "model.layers.45.mlp.experts.144.down_proj", "model.layers.45.mlp.experts.145.down_proj", "model.layers.45.mlp.experts.146.down_proj", "model.layers.45.mlp.experts.147.down_proj", "model.layers.45.mlp.experts.148.down_proj", "model.layers.45.mlp.experts.149.down_proj", "model.layers.45.mlp.experts.150.down_proj", "model.layers.45.mlp.experts.151.down_proj", "model.layers.45.mlp.experts.152.down_proj", "model.layers.45.mlp.experts.153.down_proj", "model.layers.45.mlp.experts.154.down_proj", "model.layers.45.mlp.experts.155.down_proj", "model.layers.45.mlp.experts.156.down_proj", "model.layers.45.mlp.experts.157.down_proj", "model.layers.45.mlp.experts.158.down_proj", "model.layers.45.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.9897473976016045e-05, "dbits": 1258291200 }, { "dkld": -1.8695765174924286e-05, "dbits": 2516582400 } ] }, { "idx": 273, "layers": [ "model.layers.46.self_attn.q_proj" ], "candidates": [ { "dkld": -0.00011603657621890237, "dbits": 62914560 }, { "dkld": -7.080291397869483e-05, "dbits": 125829120 } ] }, { "idx": 274, "layers": [ "model.layers.46.self_attn.k_proj", "model.layers.46.self_attn.v_proj" ], "candidates": [ { "dkld": 1.0646949522198287e-05, "dbits": 10485760 }, { "dkld": -1.2873020023106488e-05, "dbits": 20971520 } ] }, { "idx": 275, "layers": [ "model.layers.46.self_attn.o_proj" ], "candidates": [ { "dkld": 7.261103019119003e-06, "dbits": 62914560 }, { "dkld": -2.2777821868588677e-07, "dbits": 125829120 } ] }, { "idx": 276, "layers": [ "model.layers.46.mlp.shared_experts.gate_proj", "model.layers.46.mlp.shared_experts.up_proj", "model.layers.46.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.165581729262963e-05, "dbits": 23592960 }, { "dkld": -5.4172612726687e-05, "dbits": 47185920 } ] }, { "idx": 277, "layers": [ "model.layers.46.mlp.experts.0.gate_proj", "model.layers.46.mlp.experts.1.gate_proj", "model.layers.46.mlp.experts.2.gate_proj", "model.layers.46.mlp.experts.3.gate_proj", "model.layers.46.mlp.experts.4.gate_proj", "model.layers.46.mlp.experts.5.gate_proj", "model.layers.46.mlp.experts.6.gate_proj", "model.layers.46.mlp.experts.7.gate_proj", "model.layers.46.mlp.experts.8.gate_proj", "model.layers.46.mlp.experts.9.gate_proj", "model.layers.46.mlp.experts.10.gate_proj", "model.layers.46.mlp.experts.11.gate_proj", "model.layers.46.mlp.experts.12.gate_proj", "model.layers.46.mlp.experts.13.gate_proj", "model.layers.46.mlp.experts.14.gate_proj", "model.layers.46.mlp.experts.15.gate_proj", "model.layers.46.mlp.experts.16.gate_proj", "model.layers.46.mlp.experts.17.gate_proj", "model.layers.46.mlp.experts.18.gate_proj", "model.layers.46.mlp.experts.19.gate_proj", "model.layers.46.mlp.experts.20.gate_proj", "model.layers.46.mlp.experts.21.gate_proj", "model.layers.46.mlp.experts.22.gate_proj", "model.layers.46.mlp.experts.23.gate_proj", "model.layers.46.mlp.experts.24.gate_proj", "model.layers.46.mlp.experts.25.gate_proj", "model.layers.46.mlp.experts.26.gate_proj", "model.layers.46.mlp.experts.27.gate_proj", "model.layers.46.mlp.experts.28.gate_proj", "model.layers.46.mlp.experts.29.gate_proj", "model.layers.46.mlp.experts.30.gate_proj", "model.layers.46.mlp.experts.31.gate_proj", "model.layers.46.mlp.experts.32.gate_proj", "model.layers.46.mlp.experts.33.gate_proj", "model.layers.46.mlp.experts.34.gate_proj", "model.layers.46.mlp.experts.35.gate_proj", "model.layers.46.mlp.experts.36.gate_proj", "model.layers.46.mlp.experts.37.gate_proj", "model.layers.46.mlp.experts.38.gate_proj", "model.layers.46.mlp.experts.39.gate_proj", "model.layers.46.mlp.experts.40.gate_proj", "model.layers.46.mlp.experts.41.gate_proj", "model.layers.46.mlp.experts.42.gate_proj", "model.layers.46.mlp.experts.43.gate_proj", "model.layers.46.mlp.experts.44.gate_proj", "model.layers.46.mlp.experts.45.gate_proj", "model.layers.46.mlp.experts.46.gate_proj", "model.layers.46.mlp.experts.47.gate_proj", "model.layers.46.mlp.experts.48.gate_proj", "model.layers.46.mlp.experts.49.gate_proj", "model.layers.46.mlp.experts.50.gate_proj", "model.layers.46.mlp.experts.51.gate_proj", "model.layers.46.mlp.experts.52.gate_proj", "model.layers.46.mlp.experts.53.gate_proj", "model.layers.46.mlp.experts.54.gate_proj", "model.layers.46.mlp.experts.55.gate_proj", "model.layers.46.mlp.experts.56.gate_proj", "model.layers.46.mlp.experts.57.gate_proj", "model.layers.46.mlp.experts.58.gate_proj", "model.layers.46.mlp.experts.59.gate_proj", "model.layers.46.mlp.experts.60.gate_proj", "model.layers.46.mlp.experts.61.gate_proj", "model.layers.46.mlp.experts.62.gate_proj", "model.layers.46.mlp.experts.63.gate_proj", "model.layers.46.mlp.experts.64.gate_proj", "model.layers.46.mlp.experts.65.gate_proj", "model.layers.46.mlp.experts.66.gate_proj", "model.layers.46.mlp.experts.67.gate_proj", "model.layers.46.mlp.experts.68.gate_proj", "model.layers.46.mlp.experts.69.gate_proj", "model.layers.46.mlp.experts.70.gate_proj", "model.layers.46.mlp.experts.71.gate_proj", "model.layers.46.mlp.experts.72.gate_proj", "model.layers.46.mlp.experts.73.gate_proj", "model.layers.46.mlp.experts.74.gate_proj", "model.layers.46.mlp.experts.75.gate_proj", "model.layers.46.mlp.experts.76.gate_proj", "model.layers.46.mlp.experts.77.gate_proj", "model.layers.46.mlp.experts.78.gate_proj", "model.layers.46.mlp.experts.79.gate_proj", "model.layers.46.mlp.experts.80.gate_proj", "model.layers.46.mlp.experts.81.gate_proj", "model.layers.46.mlp.experts.82.gate_proj", "model.layers.46.mlp.experts.83.gate_proj", "model.layers.46.mlp.experts.84.gate_proj", "model.layers.46.mlp.experts.85.gate_proj", "model.layers.46.mlp.experts.86.gate_proj", "model.layers.46.mlp.experts.87.gate_proj", "model.layers.46.mlp.experts.88.gate_proj", "model.layers.46.mlp.experts.89.gate_proj", "model.layers.46.mlp.experts.90.gate_proj", "model.layers.46.mlp.experts.91.gate_proj", "model.layers.46.mlp.experts.92.gate_proj", "model.layers.46.mlp.experts.93.gate_proj", "model.layers.46.mlp.experts.94.gate_proj", "model.layers.46.mlp.experts.95.gate_proj", "model.layers.46.mlp.experts.96.gate_proj", "model.layers.46.mlp.experts.97.gate_proj", "model.layers.46.mlp.experts.98.gate_proj", "model.layers.46.mlp.experts.99.gate_proj", "model.layers.46.mlp.experts.100.gate_proj", "model.layers.46.mlp.experts.101.gate_proj", "model.layers.46.mlp.experts.102.gate_proj", "model.layers.46.mlp.experts.103.gate_proj", "model.layers.46.mlp.experts.104.gate_proj", "model.layers.46.mlp.experts.105.gate_proj", "model.layers.46.mlp.experts.106.gate_proj", "model.layers.46.mlp.experts.107.gate_proj", "model.layers.46.mlp.experts.108.gate_proj", "model.layers.46.mlp.experts.109.gate_proj", "model.layers.46.mlp.experts.110.gate_proj", "model.layers.46.mlp.experts.111.gate_proj", "model.layers.46.mlp.experts.112.gate_proj", "model.layers.46.mlp.experts.113.gate_proj", "model.layers.46.mlp.experts.114.gate_proj", "model.layers.46.mlp.experts.115.gate_proj", "model.layers.46.mlp.experts.116.gate_proj", "model.layers.46.mlp.experts.117.gate_proj", "model.layers.46.mlp.experts.118.gate_proj", "model.layers.46.mlp.experts.119.gate_proj", "model.layers.46.mlp.experts.120.gate_proj", "model.layers.46.mlp.experts.121.gate_proj", "model.layers.46.mlp.experts.122.gate_proj", "model.layers.46.mlp.experts.123.gate_proj", "model.layers.46.mlp.experts.124.gate_proj", "model.layers.46.mlp.experts.125.gate_proj", "model.layers.46.mlp.experts.126.gate_proj", "model.layers.46.mlp.experts.127.gate_proj", "model.layers.46.mlp.experts.128.gate_proj", "model.layers.46.mlp.experts.129.gate_proj", "model.layers.46.mlp.experts.130.gate_proj", "model.layers.46.mlp.experts.131.gate_proj", "model.layers.46.mlp.experts.132.gate_proj", "model.layers.46.mlp.experts.133.gate_proj", "model.layers.46.mlp.experts.134.gate_proj", "model.layers.46.mlp.experts.135.gate_proj", "model.layers.46.mlp.experts.136.gate_proj", "model.layers.46.mlp.experts.137.gate_proj", "model.layers.46.mlp.experts.138.gate_proj", "model.layers.46.mlp.experts.139.gate_proj", "model.layers.46.mlp.experts.140.gate_proj", "model.layers.46.mlp.experts.141.gate_proj", "model.layers.46.mlp.experts.142.gate_proj", "model.layers.46.mlp.experts.143.gate_proj", "model.layers.46.mlp.experts.144.gate_proj", "model.layers.46.mlp.experts.145.gate_proj", "model.layers.46.mlp.experts.146.gate_proj", "model.layers.46.mlp.experts.147.gate_proj", "model.layers.46.mlp.experts.148.gate_proj", "model.layers.46.mlp.experts.149.gate_proj", "model.layers.46.mlp.experts.150.gate_proj", "model.layers.46.mlp.experts.151.gate_proj", "model.layers.46.mlp.experts.152.gate_proj", "model.layers.46.mlp.experts.153.gate_proj", "model.layers.46.mlp.experts.154.gate_proj", "model.layers.46.mlp.experts.155.gate_proj", "model.layers.46.mlp.experts.156.gate_proj", "model.layers.46.mlp.experts.157.gate_proj", "model.layers.46.mlp.experts.158.gate_proj", "model.layers.46.mlp.experts.159.gate_proj", "model.layers.46.mlp.experts.0.up_proj", "model.layers.46.mlp.experts.1.up_proj", "model.layers.46.mlp.experts.2.up_proj", "model.layers.46.mlp.experts.3.up_proj", "model.layers.46.mlp.experts.4.up_proj", "model.layers.46.mlp.experts.5.up_proj", "model.layers.46.mlp.experts.6.up_proj", "model.layers.46.mlp.experts.7.up_proj", "model.layers.46.mlp.experts.8.up_proj", "model.layers.46.mlp.experts.9.up_proj", "model.layers.46.mlp.experts.10.up_proj", "model.layers.46.mlp.experts.11.up_proj", "model.layers.46.mlp.experts.12.up_proj", "model.layers.46.mlp.experts.13.up_proj", "model.layers.46.mlp.experts.14.up_proj", "model.layers.46.mlp.experts.15.up_proj", "model.layers.46.mlp.experts.16.up_proj", "model.layers.46.mlp.experts.17.up_proj", "model.layers.46.mlp.experts.18.up_proj", "model.layers.46.mlp.experts.19.up_proj", "model.layers.46.mlp.experts.20.up_proj", "model.layers.46.mlp.experts.21.up_proj", "model.layers.46.mlp.experts.22.up_proj", "model.layers.46.mlp.experts.23.up_proj", "model.layers.46.mlp.experts.24.up_proj", "model.layers.46.mlp.experts.25.up_proj", "model.layers.46.mlp.experts.26.up_proj", "model.layers.46.mlp.experts.27.up_proj", "model.layers.46.mlp.experts.28.up_proj", "model.layers.46.mlp.experts.29.up_proj", "model.layers.46.mlp.experts.30.up_proj", "model.layers.46.mlp.experts.31.up_proj", "model.layers.46.mlp.experts.32.up_proj", "model.layers.46.mlp.experts.33.up_proj", "model.layers.46.mlp.experts.34.up_proj", "model.layers.46.mlp.experts.35.up_proj", "model.layers.46.mlp.experts.36.up_proj", "model.layers.46.mlp.experts.37.up_proj", "model.layers.46.mlp.experts.38.up_proj", "model.layers.46.mlp.experts.39.up_proj", "model.layers.46.mlp.experts.40.up_proj", "model.layers.46.mlp.experts.41.up_proj", "model.layers.46.mlp.experts.42.up_proj", "model.layers.46.mlp.experts.43.up_proj", "model.layers.46.mlp.experts.44.up_proj", "model.layers.46.mlp.experts.45.up_proj", "model.layers.46.mlp.experts.46.up_proj", "model.layers.46.mlp.experts.47.up_proj", "model.layers.46.mlp.experts.48.up_proj", "model.layers.46.mlp.experts.49.up_proj", "model.layers.46.mlp.experts.50.up_proj", "model.layers.46.mlp.experts.51.up_proj", "model.layers.46.mlp.experts.52.up_proj", "model.layers.46.mlp.experts.53.up_proj", "model.layers.46.mlp.experts.54.up_proj", "model.layers.46.mlp.experts.55.up_proj", "model.layers.46.mlp.experts.56.up_proj", "model.layers.46.mlp.experts.57.up_proj", "model.layers.46.mlp.experts.58.up_proj", "model.layers.46.mlp.experts.59.up_proj", "model.layers.46.mlp.experts.60.up_proj", "model.layers.46.mlp.experts.61.up_proj", "model.layers.46.mlp.experts.62.up_proj", "model.layers.46.mlp.experts.63.up_proj", "model.layers.46.mlp.experts.64.up_proj", "model.layers.46.mlp.experts.65.up_proj", "model.layers.46.mlp.experts.66.up_proj", "model.layers.46.mlp.experts.67.up_proj", "model.layers.46.mlp.experts.68.up_proj", "model.layers.46.mlp.experts.69.up_proj", "model.layers.46.mlp.experts.70.up_proj", "model.layers.46.mlp.experts.71.up_proj", "model.layers.46.mlp.experts.72.up_proj", "model.layers.46.mlp.experts.73.up_proj", "model.layers.46.mlp.experts.74.up_proj", "model.layers.46.mlp.experts.75.up_proj", "model.layers.46.mlp.experts.76.up_proj", "model.layers.46.mlp.experts.77.up_proj", "model.layers.46.mlp.experts.78.up_proj", "model.layers.46.mlp.experts.79.up_proj", "model.layers.46.mlp.experts.80.up_proj", "model.layers.46.mlp.experts.81.up_proj", "model.layers.46.mlp.experts.82.up_proj", "model.layers.46.mlp.experts.83.up_proj", "model.layers.46.mlp.experts.84.up_proj", "model.layers.46.mlp.experts.85.up_proj", "model.layers.46.mlp.experts.86.up_proj", "model.layers.46.mlp.experts.87.up_proj", "model.layers.46.mlp.experts.88.up_proj", "model.layers.46.mlp.experts.89.up_proj", "model.layers.46.mlp.experts.90.up_proj", "model.layers.46.mlp.experts.91.up_proj", "model.layers.46.mlp.experts.92.up_proj", "model.layers.46.mlp.experts.93.up_proj", "model.layers.46.mlp.experts.94.up_proj", "model.layers.46.mlp.experts.95.up_proj", "model.layers.46.mlp.experts.96.up_proj", "model.layers.46.mlp.experts.97.up_proj", "model.layers.46.mlp.experts.98.up_proj", "model.layers.46.mlp.experts.99.up_proj", "model.layers.46.mlp.experts.100.up_proj", "model.layers.46.mlp.experts.101.up_proj", "model.layers.46.mlp.experts.102.up_proj", "model.layers.46.mlp.experts.103.up_proj", "model.layers.46.mlp.experts.104.up_proj", "model.layers.46.mlp.experts.105.up_proj", "model.layers.46.mlp.experts.106.up_proj", "model.layers.46.mlp.experts.107.up_proj", "model.layers.46.mlp.experts.108.up_proj", "model.layers.46.mlp.experts.109.up_proj", "model.layers.46.mlp.experts.110.up_proj", "model.layers.46.mlp.experts.111.up_proj", "model.layers.46.mlp.experts.112.up_proj", "model.layers.46.mlp.experts.113.up_proj", "model.layers.46.mlp.experts.114.up_proj", "model.layers.46.mlp.experts.115.up_proj", "model.layers.46.mlp.experts.116.up_proj", "model.layers.46.mlp.experts.117.up_proj", "model.layers.46.mlp.experts.118.up_proj", "model.layers.46.mlp.experts.119.up_proj", "model.layers.46.mlp.experts.120.up_proj", "model.layers.46.mlp.experts.121.up_proj", "model.layers.46.mlp.experts.122.up_proj", "model.layers.46.mlp.experts.123.up_proj", "model.layers.46.mlp.experts.124.up_proj", "model.layers.46.mlp.experts.125.up_proj", "model.layers.46.mlp.experts.126.up_proj", "model.layers.46.mlp.experts.127.up_proj", "model.layers.46.mlp.experts.128.up_proj", "model.layers.46.mlp.experts.129.up_proj", "model.layers.46.mlp.experts.130.up_proj", "model.layers.46.mlp.experts.131.up_proj", "model.layers.46.mlp.experts.132.up_proj", "model.layers.46.mlp.experts.133.up_proj", "model.layers.46.mlp.experts.134.up_proj", "model.layers.46.mlp.experts.135.up_proj", "model.layers.46.mlp.experts.136.up_proj", "model.layers.46.mlp.experts.137.up_proj", "model.layers.46.mlp.experts.138.up_proj", "model.layers.46.mlp.experts.139.up_proj", "model.layers.46.mlp.experts.140.up_proj", "model.layers.46.mlp.experts.141.up_proj", "model.layers.46.mlp.experts.142.up_proj", "model.layers.46.mlp.experts.143.up_proj", "model.layers.46.mlp.experts.144.up_proj", "model.layers.46.mlp.experts.145.up_proj", "model.layers.46.mlp.experts.146.up_proj", "model.layers.46.mlp.experts.147.up_proj", "model.layers.46.mlp.experts.148.up_proj", "model.layers.46.mlp.experts.149.up_proj", "model.layers.46.mlp.experts.150.up_proj", "model.layers.46.mlp.experts.151.up_proj", "model.layers.46.mlp.experts.152.up_proj", "model.layers.46.mlp.experts.153.up_proj", "model.layers.46.mlp.experts.154.up_proj", "model.layers.46.mlp.experts.155.up_proj", "model.layers.46.mlp.experts.156.up_proj", "model.layers.46.mlp.experts.157.up_proj", "model.layers.46.mlp.experts.158.up_proj", "model.layers.46.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.1581694707274437e-05, "dbits": 2516582400 }, { "dkld": -2.9301131144165646e-05, "dbits": 5033164800 } ] }, { "idx": 278, "layers": [ "model.layers.46.mlp.experts.0.down_proj", "model.layers.46.mlp.experts.1.down_proj", "model.layers.46.mlp.experts.2.down_proj", "model.layers.46.mlp.experts.3.down_proj", "model.layers.46.mlp.experts.4.down_proj", "model.layers.46.mlp.experts.5.down_proj", "model.layers.46.mlp.experts.6.down_proj", "model.layers.46.mlp.experts.7.down_proj", "model.layers.46.mlp.experts.8.down_proj", "model.layers.46.mlp.experts.9.down_proj", "model.layers.46.mlp.experts.10.down_proj", "model.layers.46.mlp.experts.11.down_proj", "model.layers.46.mlp.experts.12.down_proj", "model.layers.46.mlp.experts.13.down_proj", "model.layers.46.mlp.experts.14.down_proj", "model.layers.46.mlp.experts.15.down_proj", "model.layers.46.mlp.experts.16.down_proj", "model.layers.46.mlp.experts.17.down_proj", "model.layers.46.mlp.experts.18.down_proj", "model.layers.46.mlp.experts.19.down_proj", "model.layers.46.mlp.experts.20.down_proj", "model.layers.46.mlp.experts.21.down_proj", "model.layers.46.mlp.experts.22.down_proj", "model.layers.46.mlp.experts.23.down_proj", "model.layers.46.mlp.experts.24.down_proj", "model.layers.46.mlp.experts.25.down_proj", "model.layers.46.mlp.experts.26.down_proj", "model.layers.46.mlp.experts.27.down_proj", "model.layers.46.mlp.experts.28.down_proj", "model.layers.46.mlp.experts.29.down_proj", "model.layers.46.mlp.experts.30.down_proj", "model.layers.46.mlp.experts.31.down_proj", "model.layers.46.mlp.experts.32.down_proj", "model.layers.46.mlp.experts.33.down_proj", "model.layers.46.mlp.experts.34.down_proj", "model.layers.46.mlp.experts.35.down_proj", "model.layers.46.mlp.experts.36.down_proj", "model.layers.46.mlp.experts.37.down_proj", "model.layers.46.mlp.experts.38.down_proj", "model.layers.46.mlp.experts.39.down_proj", "model.layers.46.mlp.experts.40.down_proj", "model.layers.46.mlp.experts.41.down_proj", "model.layers.46.mlp.experts.42.down_proj", "model.layers.46.mlp.experts.43.down_proj", "model.layers.46.mlp.experts.44.down_proj", "model.layers.46.mlp.experts.45.down_proj", "model.layers.46.mlp.experts.46.down_proj", "model.layers.46.mlp.experts.47.down_proj", "model.layers.46.mlp.experts.48.down_proj", "model.layers.46.mlp.experts.49.down_proj", "model.layers.46.mlp.experts.50.down_proj", "model.layers.46.mlp.experts.51.down_proj", "model.layers.46.mlp.experts.52.down_proj", "model.layers.46.mlp.experts.53.down_proj", "model.layers.46.mlp.experts.54.down_proj", "model.layers.46.mlp.experts.55.down_proj", "model.layers.46.mlp.experts.56.down_proj", "model.layers.46.mlp.experts.57.down_proj", "model.layers.46.mlp.experts.58.down_proj", "model.layers.46.mlp.experts.59.down_proj", "model.layers.46.mlp.experts.60.down_proj", "model.layers.46.mlp.experts.61.down_proj", "model.layers.46.mlp.experts.62.down_proj", "model.layers.46.mlp.experts.63.down_proj", "model.layers.46.mlp.experts.64.down_proj", "model.layers.46.mlp.experts.65.down_proj", "model.layers.46.mlp.experts.66.down_proj", "model.layers.46.mlp.experts.67.down_proj", "model.layers.46.mlp.experts.68.down_proj", "model.layers.46.mlp.experts.69.down_proj", "model.layers.46.mlp.experts.70.down_proj", "model.layers.46.mlp.experts.71.down_proj", "model.layers.46.mlp.experts.72.down_proj", "model.layers.46.mlp.experts.73.down_proj", "model.layers.46.mlp.experts.74.down_proj", "model.layers.46.mlp.experts.75.down_proj", "model.layers.46.mlp.experts.76.down_proj", "model.layers.46.mlp.experts.77.down_proj", "model.layers.46.mlp.experts.78.down_proj", "model.layers.46.mlp.experts.79.down_proj", "model.layers.46.mlp.experts.80.down_proj", "model.layers.46.mlp.experts.81.down_proj", "model.layers.46.mlp.experts.82.down_proj", "model.layers.46.mlp.experts.83.down_proj", "model.layers.46.mlp.experts.84.down_proj", "model.layers.46.mlp.experts.85.down_proj", "model.layers.46.mlp.experts.86.down_proj", "model.layers.46.mlp.experts.87.down_proj", "model.layers.46.mlp.experts.88.down_proj", "model.layers.46.mlp.experts.89.down_proj", "model.layers.46.mlp.experts.90.down_proj", "model.layers.46.mlp.experts.91.down_proj", "model.layers.46.mlp.experts.92.down_proj", "model.layers.46.mlp.experts.93.down_proj", "model.layers.46.mlp.experts.94.down_proj", "model.layers.46.mlp.experts.95.down_proj", "model.layers.46.mlp.experts.96.down_proj", "model.layers.46.mlp.experts.97.down_proj", "model.layers.46.mlp.experts.98.down_proj", "model.layers.46.mlp.experts.99.down_proj", "model.layers.46.mlp.experts.100.down_proj", "model.layers.46.mlp.experts.101.down_proj", "model.layers.46.mlp.experts.102.down_proj", "model.layers.46.mlp.experts.103.down_proj", "model.layers.46.mlp.experts.104.down_proj", "model.layers.46.mlp.experts.105.down_proj", "model.layers.46.mlp.experts.106.down_proj", "model.layers.46.mlp.experts.107.down_proj", "model.layers.46.mlp.experts.108.down_proj", "model.layers.46.mlp.experts.109.down_proj", "model.layers.46.mlp.experts.110.down_proj", "model.layers.46.mlp.experts.111.down_proj", "model.layers.46.mlp.experts.112.down_proj", "model.layers.46.mlp.experts.113.down_proj", "model.layers.46.mlp.experts.114.down_proj", "model.layers.46.mlp.experts.115.down_proj", "model.layers.46.mlp.experts.116.down_proj", "model.layers.46.mlp.experts.117.down_proj", "model.layers.46.mlp.experts.118.down_proj", "model.layers.46.mlp.experts.119.down_proj", "model.layers.46.mlp.experts.120.down_proj", "model.layers.46.mlp.experts.121.down_proj", "model.layers.46.mlp.experts.122.down_proj", "model.layers.46.mlp.experts.123.down_proj", "model.layers.46.mlp.experts.124.down_proj", "model.layers.46.mlp.experts.125.down_proj", "model.layers.46.mlp.experts.126.down_proj", "model.layers.46.mlp.experts.127.down_proj", "model.layers.46.mlp.experts.128.down_proj", "model.layers.46.mlp.experts.129.down_proj", "model.layers.46.mlp.experts.130.down_proj", "model.layers.46.mlp.experts.131.down_proj", "model.layers.46.mlp.experts.132.down_proj", "model.layers.46.mlp.experts.133.down_proj", "model.layers.46.mlp.experts.134.down_proj", "model.layers.46.mlp.experts.135.down_proj", "model.layers.46.mlp.experts.136.down_proj", "model.layers.46.mlp.experts.137.down_proj", "model.layers.46.mlp.experts.138.down_proj", "model.layers.46.mlp.experts.139.down_proj", "model.layers.46.mlp.experts.140.down_proj", "model.layers.46.mlp.experts.141.down_proj", "model.layers.46.mlp.experts.142.down_proj", "model.layers.46.mlp.experts.143.down_proj", "model.layers.46.mlp.experts.144.down_proj", "model.layers.46.mlp.experts.145.down_proj", "model.layers.46.mlp.experts.146.down_proj", "model.layers.46.mlp.experts.147.down_proj", "model.layers.46.mlp.experts.148.down_proj", "model.layers.46.mlp.experts.149.down_proj", "model.layers.46.mlp.experts.150.down_proj", "model.layers.46.mlp.experts.151.down_proj", "model.layers.46.mlp.experts.152.down_proj", "model.layers.46.mlp.experts.153.down_proj", "model.layers.46.mlp.experts.154.down_proj", "model.layers.46.mlp.experts.155.down_proj", "model.layers.46.mlp.experts.156.down_proj", "model.layers.46.mlp.experts.157.down_proj", "model.layers.46.mlp.experts.158.down_proj", "model.layers.46.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 3.306646831333776e-05, "dbits": 1258291200 }, { "dkld": -3.922567702829144e-06, "dbits": 2516582400 } ] }, { "idx": 279, "layers": [ "model.layers.47.self_attn.q_proj" ], "candidates": [ { "dkld": -6.6359760239713406e-06, "dbits": 62914560 }, { "dkld": 1.5388615429401745e-05, "dbits": 125829120 } ] }, { "idx": 280, "layers": [ "model.layers.47.self_attn.k_proj", "model.layers.47.self_attn.v_proj" ], "candidates": [ { "dkld": 5.879658274352689e-05, "dbits": 10485760 }, { "dkld": 2.208568621426925e-05, "dbits": 20971520 } ] }, { "idx": 281, "layers": [ "model.layers.47.self_attn.o_proj" ], "candidates": [ { "dkld": -5.097703542560235e-05, "dbits": 62914560 }, { "dkld": -2.1954928524791154e-05, "dbits": 125829120 } ] }, { "idx": 282, "layers": [ "model.layers.47.mlp.shared_experts.gate_proj", "model.layers.47.mlp.shared_experts.up_proj", "model.layers.47.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.056719433516125e-05, "dbits": 23592960 }, { "dkld": -2.976756077259675e-05, "dbits": 47185920 } ] }, { "idx": 283, "layers": [ "model.layers.47.mlp.experts.0.gate_proj", "model.layers.47.mlp.experts.1.gate_proj", "model.layers.47.mlp.experts.2.gate_proj", "model.layers.47.mlp.experts.3.gate_proj", "model.layers.47.mlp.experts.4.gate_proj", "model.layers.47.mlp.experts.5.gate_proj", "model.layers.47.mlp.experts.6.gate_proj", "model.layers.47.mlp.experts.7.gate_proj", "model.layers.47.mlp.experts.8.gate_proj", "model.layers.47.mlp.experts.9.gate_proj", "model.layers.47.mlp.experts.10.gate_proj", "model.layers.47.mlp.experts.11.gate_proj", "model.layers.47.mlp.experts.12.gate_proj", "model.layers.47.mlp.experts.13.gate_proj", "model.layers.47.mlp.experts.14.gate_proj", "model.layers.47.mlp.experts.15.gate_proj", "model.layers.47.mlp.experts.16.gate_proj", "model.layers.47.mlp.experts.17.gate_proj", "model.layers.47.mlp.experts.18.gate_proj", "model.layers.47.mlp.experts.19.gate_proj", "model.layers.47.mlp.experts.20.gate_proj", "model.layers.47.mlp.experts.21.gate_proj", "model.layers.47.mlp.experts.22.gate_proj", "model.layers.47.mlp.experts.23.gate_proj", "model.layers.47.mlp.experts.24.gate_proj", "model.layers.47.mlp.experts.25.gate_proj", "model.layers.47.mlp.experts.26.gate_proj", "model.layers.47.mlp.experts.27.gate_proj", "model.layers.47.mlp.experts.28.gate_proj", "model.layers.47.mlp.experts.29.gate_proj", "model.layers.47.mlp.experts.30.gate_proj", "model.layers.47.mlp.experts.31.gate_proj", "model.layers.47.mlp.experts.32.gate_proj", "model.layers.47.mlp.experts.33.gate_proj", "model.layers.47.mlp.experts.34.gate_proj", "model.layers.47.mlp.experts.35.gate_proj", "model.layers.47.mlp.experts.36.gate_proj", "model.layers.47.mlp.experts.37.gate_proj", "model.layers.47.mlp.experts.38.gate_proj", "model.layers.47.mlp.experts.39.gate_proj", "model.layers.47.mlp.experts.40.gate_proj", "model.layers.47.mlp.experts.41.gate_proj", "model.layers.47.mlp.experts.42.gate_proj", "model.layers.47.mlp.experts.43.gate_proj", "model.layers.47.mlp.experts.44.gate_proj", "model.layers.47.mlp.experts.45.gate_proj", "model.layers.47.mlp.experts.46.gate_proj", "model.layers.47.mlp.experts.47.gate_proj", "model.layers.47.mlp.experts.48.gate_proj", "model.layers.47.mlp.experts.49.gate_proj", "model.layers.47.mlp.experts.50.gate_proj", "model.layers.47.mlp.experts.51.gate_proj", "model.layers.47.mlp.experts.52.gate_proj", "model.layers.47.mlp.experts.53.gate_proj", "model.layers.47.mlp.experts.54.gate_proj", "model.layers.47.mlp.experts.55.gate_proj", "model.layers.47.mlp.experts.56.gate_proj", "model.layers.47.mlp.experts.57.gate_proj", "model.layers.47.mlp.experts.58.gate_proj", "model.layers.47.mlp.experts.59.gate_proj", "model.layers.47.mlp.experts.60.gate_proj", "model.layers.47.mlp.experts.61.gate_proj", "model.layers.47.mlp.experts.62.gate_proj", "model.layers.47.mlp.experts.63.gate_proj", "model.layers.47.mlp.experts.64.gate_proj", "model.layers.47.mlp.experts.65.gate_proj", "model.layers.47.mlp.experts.66.gate_proj", "model.layers.47.mlp.experts.67.gate_proj", "model.layers.47.mlp.experts.68.gate_proj", "model.layers.47.mlp.experts.69.gate_proj", "model.layers.47.mlp.experts.70.gate_proj", "model.layers.47.mlp.experts.71.gate_proj", "model.layers.47.mlp.experts.72.gate_proj", "model.layers.47.mlp.experts.73.gate_proj", "model.layers.47.mlp.experts.74.gate_proj", "model.layers.47.mlp.experts.75.gate_proj", "model.layers.47.mlp.experts.76.gate_proj", "model.layers.47.mlp.experts.77.gate_proj", "model.layers.47.mlp.experts.78.gate_proj", "model.layers.47.mlp.experts.79.gate_proj", "model.layers.47.mlp.experts.80.gate_proj", "model.layers.47.mlp.experts.81.gate_proj", "model.layers.47.mlp.experts.82.gate_proj", "model.layers.47.mlp.experts.83.gate_proj", "model.layers.47.mlp.experts.84.gate_proj", "model.layers.47.mlp.experts.85.gate_proj", "model.layers.47.mlp.experts.86.gate_proj", "model.layers.47.mlp.experts.87.gate_proj", "model.layers.47.mlp.experts.88.gate_proj", "model.layers.47.mlp.experts.89.gate_proj", "model.layers.47.mlp.experts.90.gate_proj", "model.layers.47.mlp.experts.91.gate_proj", "model.layers.47.mlp.experts.92.gate_proj", "model.layers.47.mlp.experts.93.gate_proj", "model.layers.47.mlp.experts.94.gate_proj", "model.layers.47.mlp.experts.95.gate_proj", "model.layers.47.mlp.experts.96.gate_proj", "model.layers.47.mlp.experts.97.gate_proj", "model.layers.47.mlp.experts.98.gate_proj", "model.layers.47.mlp.experts.99.gate_proj", "model.layers.47.mlp.experts.100.gate_proj", "model.layers.47.mlp.experts.101.gate_proj", "model.layers.47.mlp.experts.102.gate_proj", "model.layers.47.mlp.experts.103.gate_proj", "model.layers.47.mlp.experts.104.gate_proj", "model.layers.47.mlp.experts.105.gate_proj", "model.layers.47.mlp.experts.106.gate_proj", "model.layers.47.mlp.experts.107.gate_proj", "model.layers.47.mlp.experts.108.gate_proj", "model.layers.47.mlp.experts.109.gate_proj", "model.layers.47.mlp.experts.110.gate_proj", "model.layers.47.mlp.experts.111.gate_proj", "model.layers.47.mlp.experts.112.gate_proj", "model.layers.47.mlp.experts.113.gate_proj", "model.layers.47.mlp.experts.114.gate_proj", "model.layers.47.mlp.experts.115.gate_proj", "model.layers.47.mlp.experts.116.gate_proj", "model.layers.47.mlp.experts.117.gate_proj", "model.layers.47.mlp.experts.118.gate_proj", "model.layers.47.mlp.experts.119.gate_proj", "model.layers.47.mlp.experts.120.gate_proj", "model.layers.47.mlp.experts.121.gate_proj", "model.layers.47.mlp.experts.122.gate_proj", "model.layers.47.mlp.experts.123.gate_proj", "model.layers.47.mlp.experts.124.gate_proj", "model.layers.47.mlp.experts.125.gate_proj", "model.layers.47.mlp.experts.126.gate_proj", "model.layers.47.mlp.experts.127.gate_proj", "model.layers.47.mlp.experts.128.gate_proj", "model.layers.47.mlp.experts.129.gate_proj", "model.layers.47.mlp.experts.130.gate_proj", "model.layers.47.mlp.experts.131.gate_proj", "model.layers.47.mlp.experts.132.gate_proj", "model.layers.47.mlp.experts.133.gate_proj", "model.layers.47.mlp.experts.134.gate_proj", "model.layers.47.mlp.experts.135.gate_proj", "model.layers.47.mlp.experts.136.gate_proj", "model.layers.47.mlp.experts.137.gate_proj", "model.layers.47.mlp.experts.138.gate_proj", "model.layers.47.mlp.experts.139.gate_proj", "model.layers.47.mlp.experts.140.gate_proj", "model.layers.47.mlp.experts.141.gate_proj", "model.layers.47.mlp.experts.142.gate_proj", "model.layers.47.mlp.experts.143.gate_proj", "model.layers.47.mlp.experts.144.gate_proj", "model.layers.47.mlp.experts.145.gate_proj", "model.layers.47.mlp.experts.146.gate_proj", "model.layers.47.mlp.experts.147.gate_proj", "model.layers.47.mlp.experts.148.gate_proj", "model.layers.47.mlp.experts.149.gate_proj", "model.layers.47.mlp.experts.150.gate_proj", "model.layers.47.mlp.experts.151.gate_proj", "model.layers.47.mlp.experts.152.gate_proj", "model.layers.47.mlp.experts.153.gate_proj", "model.layers.47.mlp.experts.154.gate_proj", "model.layers.47.mlp.experts.155.gate_proj", "model.layers.47.mlp.experts.156.gate_proj", "model.layers.47.mlp.experts.157.gate_proj", "model.layers.47.mlp.experts.158.gate_proj", "model.layers.47.mlp.experts.159.gate_proj", "model.layers.47.mlp.experts.0.up_proj", "model.layers.47.mlp.experts.1.up_proj", "model.layers.47.mlp.experts.2.up_proj", "model.layers.47.mlp.experts.3.up_proj", "model.layers.47.mlp.experts.4.up_proj", "model.layers.47.mlp.experts.5.up_proj", "model.layers.47.mlp.experts.6.up_proj", "model.layers.47.mlp.experts.7.up_proj", "model.layers.47.mlp.experts.8.up_proj", "model.layers.47.mlp.experts.9.up_proj", "model.layers.47.mlp.experts.10.up_proj", "model.layers.47.mlp.experts.11.up_proj", "model.layers.47.mlp.experts.12.up_proj", "model.layers.47.mlp.experts.13.up_proj", "model.layers.47.mlp.experts.14.up_proj", "model.layers.47.mlp.experts.15.up_proj", "model.layers.47.mlp.experts.16.up_proj", "model.layers.47.mlp.experts.17.up_proj", "model.layers.47.mlp.experts.18.up_proj", "model.layers.47.mlp.experts.19.up_proj", "model.layers.47.mlp.experts.20.up_proj", "model.layers.47.mlp.experts.21.up_proj", "model.layers.47.mlp.experts.22.up_proj", "model.layers.47.mlp.experts.23.up_proj", "model.layers.47.mlp.experts.24.up_proj", "model.layers.47.mlp.experts.25.up_proj", "model.layers.47.mlp.experts.26.up_proj", "model.layers.47.mlp.experts.27.up_proj", "model.layers.47.mlp.experts.28.up_proj", "model.layers.47.mlp.experts.29.up_proj", "model.layers.47.mlp.experts.30.up_proj", "model.layers.47.mlp.experts.31.up_proj", "model.layers.47.mlp.experts.32.up_proj", "model.layers.47.mlp.experts.33.up_proj", "model.layers.47.mlp.experts.34.up_proj", "model.layers.47.mlp.experts.35.up_proj", "model.layers.47.mlp.experts.36.up_proj", "model.layers.47.mlp.experts.37.up_proj", "model.layers.47.mlp.experts.38.up_proj", "model.layers.47.mlp.experts.39.up_proj", "model.layers.47.mlp.experts.40.up_proj", "model.layers.47.mlp.experts.41.up_proj", "model.layers.47.mlp.experts.42.up_proj", "model.layers.47.mlp.experts.43.up_proj", "model.layers.47.mlp.experts.44.up_proj", "model.layers.47.mlp.experts.45.up_proj", "model.layers.47.mlp.experts.46.up_proj", "model.layers.47.mlp.experts.47.up_proj", "model.layers.47.mlp.experts.48.up_proj", "model.layers.47.mlp.experts.49.up_proj", "model.layers.47.mlp.experts.50.up_proj", "model.layers.47.mlp.experts.51.up_proj", "model.layers.47.mlp.experts.52.up_proj", "model.layers.47.mlp.experts.53.up_proj", "model.layers.47.mlp.experts.54.up_proj", "model.layers.47.mlp.experts.55.up_proj", "model.layers.47.mlp.experts.56.up_proj", "model.layers.47.mlp.experts.57.up_proj", "model.layers.47.mlp.experts.58.up_proj", "model.layers.47.mlp.experts.59.up_proj", "model.layers.47.mlp.experts.60.up_proj", "model.layers.47.mlp.experts.61.up_proj", "model.layers.47.mlp.experts.62.up_proj", "model.layers.47.mlp.experts.63.up_proj", "model.layers.47.mlp.experts.64.up_proj", "model.layers.47.mlp.experts.65.up_proj", "model.layers.47.mlp.experts.66.up_proj", "model.layers.47.mlp.experts.67.up_proj", "model.layers.47.mlp.experts.68.up_proj", "model.layers.47.mlp.experts.69.up_proj", "model.layers.47.mlp.experts.70.up_proj", "model.layers.47.mlp.experts.71.up_proj", "model.layers.47.mlp.experts.72.up_proj", "model.layers.47.mlp.experts.73.up_proj", "model.layers.47.mlp.experts.74.up_proj", "model.layers.47.mlp.experts.75.up_proj", "model.layers.47.mlp.experts.76.up_proj", "model.layers.47.mlp.experts.77.up_proj", "model.layers.47.mlp.experts.78.up_proj", "model.layers.47.mlp.experts.79.up_proj", "model.layers.47.mlp.experts.80.up_proj", "model.layers.47.mlp.experts.81.up_proj", "model.layers.47.mlp.experts.82.up_proj", "model.layers.47.mlp.experts.83.up_proj", "model.layers.47.mlp.experts.84.up_proj", "model.layers.47.mlp.experts.85.up_proj", "model.layers.47.mlp.experts.86.up_proj", "model.layers.47.mlp.experts.87.up_proj", "model.layers.47.mlp.experts.88.up_proj", "model.layers.47.mlp.experts.89.up_proj", "model.layers.47.mlp.experts.90.up_proj", "model.layers.47.mlp.experts.91.up_proj", "model.layers.47.mlp.experts.92.up_proj", "model.layers.47.mlp.experts.93.up_proj", "model.layers.47.mlp.experts.94.up_proj", "model.layers.47.mlp.experts.95.up_proj", "model.layers.47.mlp.experts.96.up_proj", "model.layers.47.mlp.experts.97.up_proj", "model.layers.47.mlp.experts.98.up_proj", "model.layers.47.mlp.experts.99.up_proj", "model.layers.47.mlp.experts.100.up_proj", "model.layers.47.mlp.experts.101.up_proj", "model.layers.47.mlp.experts.102.up_proj", "model.layers.47.mlp.experts.103.up_proj", "model.layers.47.mlp.experts.104.up_proj", "model.layers.47.mlp.experts.105.up_proj", "model.layers.47.mlp.experts.106.up_proj", "model.layers.47.mlp.experts.107.up_proj", "model.layers.47.mlp.experts.108.up_proj", "model.layers.47.mlp.experts.109.up_proj", "model.layers.47.mlp.experts.110.up_proj", "model.layers.47.mlp.experts.111.up_proj", "model.layers.47.mlp.experts.112.up_proj", "model.layers.47.mlp.experts.113.up_proj", "model.layers.47.mlp.experts.114.up_proj", "model.layers.47.mlp.experts.115.up_proj", "model.layers.47.mlp.experts.116.up_proj", "model.layers.47.mlp.experts.117.up_proj", "model.layers.47.mlp.experts.118.up_proj", "model.layers.47.mlp.experts.119.up_proj", "model.layers.47.mlp.experts.120.up_proj", "model.layers.47.mlp.experts.121.up_proj", "model.layers.47.mlp.experts.122.up_proj", "model.layers.47.mlp.experts.123.up_proj", "model.layers.47.mlp.experts.124.up_proj", "model.layers.47.mlp.experts.125.up_proj", "model.layers.47.mlp.experts.126.up_proj", "model.layers.47.mlp.experts.127.up_proj", "model.layers.47.mlp.experts.128.up_proj", "model.layers.47.mlp.experts.129.up_proj", "model.layers.47.mlp.experts.130.up_proj", "model.layers.47.mlp.experts.131.up_proj", "model.layers.47.mlp.experts.132.up_proj", "model.layers.47.mlp.experts.133.up_proj", "model.layers.47.mlp.experts.134.up_proj", "model.layers.47.mlp.experts.135.up_proj", "model.layers.47.mlp.experts.136.up_proj", "model.layers.47.mlp.experts.137.up_proj", "model.layers.47.mlp.experts.138.up_proj", "model.layers.47.mlp.experts.139.up_proj", "model.layers.47.mlp.experts.140.up_proj", "model.layers.47.mlp.experts.141.up_proj", "model.layers.47.mlp.experts.142.up_proj", "model.layers.47.mlp.experts.143.up_proj", "model.layers.47.mlp.experts.144.up_proj", "model.layers.47.mlp.experts.145.up_proj", "model.layers.47.mlp.experts.146.up_proj", "model.layers.47.mlp.experts.147.up_proj", "model.layers.47.mlp.experts.148.up_proj", "model.layers.47.mlp.experts.149.up_proj", "model.layers.47.mlp.experts.150.up_proj", "model.layers.47.mlp.experts.151.up_proj", "model.layers.47.mlp.experts.152.up_proj", "model.layers.47.mlp.experts.153.up_proj", "model.layers.47.mlp.experts.154.up_proj", "model.layers.47.mlp.experts.155.up_proj", "model.layers.47.mlp.experts.156.up_proj", "model.layers.47.mlp.experts.157.up_proj", "model.layers.47.mlp.experts.158.up_proj", "model.layers.47.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.9520381465555625e-05, "dbits": 2516582400 }, { "dkld": -2.7865637093772017e-06, "dbits": 5033164800 } ] }, { "idx": 284, "layers": [ "model.layers.47.mlp.experts.0.down_proj", "model.layers.47.mlp.experts.1.down_proj", "model.layers.47.mlp.experts.2.down_proj", "model.layers.47.mlp.experts.3.down_proj", "model.layers.47.mlp.experts.4.down_proj", "model.layers.47.mlp.experts.5.down_proj", "model.layers.47.mlp.experts.6.down_proj", "model.layers.47.mlp.experts.7.down_proj", "model.layers.47.mlp.experts.8.down_proj", "model.layers.47.mlp.experts.9.down_proj", "model.layers.47.mlp.experts.10.down_proj", "model.layers.47.mlp.experts.11.down_proj", "model.layers.47.mlp.experts.12.down_proj", "model.layers.47.mlp.experts.13.down_proj", "model.layers.47.mlp.experts.14.down_proj", "model.layers.47.mlp.experts.15.down_proj", "model.layers.47.mlp.experts.16.down_proj", "model.layers.47.mlp.experts.17.down_proj", "model.layers.47.mlp.experts.18.down_proj", "model.layers.47.mlp.experts.19.down_proj", "model.layers.47.mlp.experts.20.down_proj", "model.layers.47.mlp.experts.21.down_proj", "model.layers.47.mlp.experts.22.down_proj", "model.layers.47.mlp.experts.23.down_proj", "model.layers.47.mlp.experts.24.down_proj", "model.layers.47.mlp.experts.25.down_proj", "model.layers.47.mlp.experts.26.down_proj", "model.layers.47.mlp.experts.27.down_proj", "model.layers.47.mlp.experts.28.down_proj", "model.layers.47.mlp.experts.29.down_proj", "model.layers.47.mlp.experts.30.down_proj", "model.layers.47.mlp.experts.31.down_proj", "model.layers.47.mlp.experts.32.down_proj", "model.layers.47.mlp.experts.33.down_proj", "model.layers.47.mlp.experts.34.down_proj", "model.layers.47.mlp.experts.35.down_proj", "model.layers.47.mlp.experts.36.down_proj", "model.layers.47.mlp.experts.37.down_proj", "model.layers.47.mlp.experts.38.down_proj", "model.layers.47.mlp.experts.39.down_proj", "model.layers.47.mlp.experts.40.down_proj", "model.layers.47.mlp.experts.41.down_proj", "model.layers.47.mlp.experts.42.down_proj", "model.layers.47.mlp.experts.43.down_proj", "model.layers.47.mlp.experts.44.down_proj", "model.layers.47.mlp.experts.45.down_proj", "model.layers.47.mlp.experts.46.down_proj", "model.layers.47.mlp.experts.47.down_proj", "model.layers.47.mlp.experts.48.down_proj", "model.layers.47.mlp.experts.49.down_proj", "model.layers.47.mlp.experts.50.down_proj", "model.layers.47.mlp.experts.51.down_proj", "model.layers.47.mlp.experts.52.down_proj", "model.layers.47.mlp.experts.53.down_proj", "model.layers.47.mlp.experts.54.down_proj", "model.layers.47.mlp.experts.55.down_proj", "model.layers.47.mlp.experts.56.down_proj", "model.layers.47.mlp.experts.57.down_proj", "model.layers.47.mlp.experts.58.down_proj", "model.layers.47.mlp.experts.59.down_proj", "model.layers.47.mlp.experts.60.down_proj", "model.layers.47.mlp.experts.61.down_proj", "model.layers.47.mlp.experts.62.down_proj", "model.layers.47.mlp.experts.63.down_proj", "model.layers.47.mlp.experts.64.down_proj", "model.layers.47.mlp.experts.65.down_proj", "model.layers.47.mlp.experts.66.down_proj", "model.layers.47.mlp.experts.67.down_proj", "model.layers.47.mlp.experts.68.down_proj", "model.layers.47.mlp.experts.69.down_proj", "model.layers.47.mlp.experts.70.down_proj", "model.layers.47.mlp.experts.71.down_proj", "model.layers.47.mlp.experts.72.down_proj", "model.layers.47.mlp.experts.73.down_proj", "model.layers.47.mlp.experts.74.down_proj", "model.layers.47.mlp.experts.75.down_proj", "model.layers.47.mlp.experts.76.down_proj", "model.layers.47.mlp.experts.77.down_proj", "model.layers.47.mlp.experts.78.down_proj", "model.layers.47.mlp.experts.79.down_proj", "model.layers.47.mlp.experts.80.down_proj", "model.layers.47.mlp.experts.81.down_proj", "model.layers.47.mlp.experts.82.down_proj", "model.layers.47.mlp.experts.83.down_proj", "model.layers.47.mlp.experts.84.down_proj", "model.layers.47.mlp.experts.85.down_proj", "model.layers.47.mlp.experts.86.down_proj", "model.layers.47.mlp.experts.87.down_proj", "model.layers.47.mlp.experts.88.down_proj", "model.layers.47.mlp.experts.89.down_proj", "model.layers.47.mlp.experts.90.down_proj", "model.layers.47.mlp.experts.91.down_proj", "model.layers.47.mlp.experts.92.down_proj", "model.layers.47.mlp.experts.93.down_proj", "model.layers.47.mlp.experts.94.down_proj", "model.layers.47.mlp.experts.95.down_proj", "model.layers.47.mlp.experts.96.down_proj", "model.layers.47.mlp.experts.97.down_proj", "model.layers.47.mlp.experts.98.down_proj", "model.layers.47.mlp.experts.99.down_proj", "model.layers.47.mlp.experts.100.down_proj", "model.layers.47.mlp.experts.101.down_proj", "model.layers.47.mlp.experts.102.down_proj", "model.layers.47.mlp.experts.103.down_proj", "model.layers.47.mlp.experts.104.down_proj", "model.layers.47.mlp.experts.105.down_proj", "model.layers.47.mlp.experts.106.down_proj", "model.layers.47.mlp.experts.107.down_proj", "model.layers.47.mlp.experts.108.down_proj", "model.layers.47.mlp.experts.109.down_proj", "model.layers.47.mlp.experts.110.down_proj", "model.layers.47.mlp.experts.111.down_proj", "model.layers.47.mlp.experts.112.down_proj", "model.layers.47.mlp.experts.113.down_proj", "model.layers.47.mlp.experts.114.down_proj", "model.layers.47.mlp.experts.115.down_proj", "model.layers.47.mlp.experts.116.down_proj", "model.layers.47.mlp.experts.117.down_proj", "model.layers.47.mlp.experts.118.down_proj", "model.layers.47.mlp.experts.119.down_proj", "model.layers.47.mlp.experts.120.down_proj", "model.layers.47.mlp.experts.121.down_proj", "model.layers.47.mlp.experts.122.down_proj", "model.layers.47.mlp.experts.123.down_proj", "model.layers.47.mlp.experts.124.down_proj", "model.layers.47.mlp.experts.125.down_proj", "model.layers.47.mlp.experts.126.down_proj", "model.layers.47.mlp.experts.127.down_proj", "model.layers.47.mlp.experts.128.down_proj", "model.layers.47.mlp.experts.129.down_proj", "model.layers.47.mlp.experts.130.down_proj", "model.layers.47.mlp.experts.131.down_proj", "model.layers.47.mlp.experts.132.down_proj", "model.layers.47.mlp.experts.133.down_proj", "model.layers.47.mlp.experts.134.down_proj", "model.layers.47.mlp.experts.135.down_proj", "model.layers.47.mlp.experts.136.down_proj", "model.layers.47.mlp.experts.137.down_proj", "model.layers.47.mlp.experts.138.down_proj", "model.layers.47.mlp.experts.139.down_proj", "model.layers.47.mlp.experts.140.down_proj", "model.layers.47.mlp.experts.141.down_proj", "model.layers.47.mlp.experts.142.down_proj", "model.layers.47.mlp.experts.143.down_proj", "model.layers.47.mlp.experts.144.down_proj", "model.layers.47.mlp.experts.145.down_proj", "model.layers.47.mlp.experts.146.down_proj", "model.layers.47.mlp.experts.147.down_proj", "model.layers.47.mlp.experts.148.down_proj", "model.layers.47.mlp.experts.149.down_proj", "model.layers.47.mlp.experts.150.down_proj", "model.layers.47.mlp.experts.151.down_proj", "model.layers.47.mlp.experts.152.down_proj", "model.layers.47.mlp.experts.153.down_proj", "model.layers.47.mlp.experts.154.down_proj", "model.layers.47.mlp.experts.155.down_proj", "model.layers.47.mlp.experts.156.down_proj", "model.layers.47.mlp.experts.157.down_proj", "model.layers.47.mlp.experts.158.down_proj", "model.layers.47.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.8651969730852647e-05, "dbits": 1258291200 }, { "dkld": -2.970963250845636e-05, "dbits": 2516582400 } ] }, { "idx": 285, "layers": [ "model.layers.48.self_attn.q_proj" ], "candidates": [ { "dkld": -6.924001500010352e-05, "dbits": 62914560 }, { "dkld": -4.03401441872106e-05, "dbits": 125829120 } ] }, { "idx": 286, "layers": [ "model.layers.48.self_attn.k_proj", "model.layers.48.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0001358264358714209, "dbits": 10485760 }, { "dkld": -0.00012686483096331289, "dbits": 20971520 } ] }, { "idx": 287, "layers": [ "model.layers.48.self_attn.o_proj" ], "candidates": [ { "dkld": -1.761610619723658e-05, "dbits": 62914560 }, { "dkld": 9.373668581247677e-06, "dbits": 125829120 } ] }, { "idx": 288, "layers": [ "model.layers.48.mlp.shared_experts.gate_proj", "model.layers.48.mlp.shared_experts.up_proj", "model.layers.48.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 5.973069928586622e-05, "dbits": 23592960 }, { "dkld": 5.0002895295621005e-05, "dbits": 47185920 } ] }, { "idx": 289, "layers": [ "model.layers.48.mlp.experts.0.gate_proj", "model.layers.48.mlp.experts.1.gate_proj", "model.layers.48.mlp.experts.2.gate_proj", "model.layers.48.mlp.experts.3.gate_proj", "model.layers.48.mlp.experts.4.gate_proj", "model.layers.48.mlp.experts.5.gate_proj", "model.layers.48.mlp.experts.6.gate_proj", "model.layers.48.mlp.experts.7.gate_proj", "model.layers.48.mlp.experts.8.gate_proj", "model.layers.48.mlp.experts.9.gate_proj", "model.layers.48.mlp.experts.10.gate_proj", "model.layers.48.mlp.experts.11.gate_proj", "model.layers.48.mlp.experts.12.gate_proj", "model.layers.48.mlp.experts.13.gate_proj", "model.layers.48.mlp.experts.14.gate_proj", "model.layers.48.mlp.experts.15.gate_proj", "model.layers.48.mlp.experts.16.gate_proj", "model.layers.48.mlp.experts.17.gate_proj", "model.layers.48.mlp.experts.18.gate_proj", "model.layers.48.mlp.experts.19.gate_proj", "model.layers.48.mlp.experts.20.gate_proj", "model.layers.48.mlp.experts.21.gate_proj", "model.layers.48.mlp.experts.22.gate_proj", "model.layers.48.mlp.experts.23.gate_proj", "model.layers.48.mlp.experts.24.gate_proj", "model.layers.48.mlp.experts.25.gate_proj", "model.layers.48.mlp.experts.26.gate_proj", "model.layers.48.mlp.experts.27.gate_proj", "model.layers.48.mlp.experts.28.gate_proj", "model.layers.48.mlp.experts.29.gate_proj", "model.layers.48.mlp.experts.30.gate_proj", "model.layers.48.mlp.experts.31.gate_proj", "model.layers.48.mlp.experts.32.gate_proj", "model.layers.48.mlp.experts.33.gate_proj", "model.layers.48.mlp.experts.34.gate_proj", "model.layers.48.mlp.experts.35.gate_proj", "model.layers.48.mlp.experts.36.gate_proj", "model.layers.48.mlp.experts.37.gate_proj", "model.layers.48.mlp.experts.38.gate_proj", "model.layers.48.mlp.experts.39.gate_proj", "model.layers.48.mlp.experts.40.gate_proj", "model.layers.48.mlp.experts.41.gate_proj", "model.layers.48.mlp.experts.42.gate_proj", "model.layers.48.mlp.experts.43.gate_proj", "model.layers.48.mlp.experts.44.gate_proj", "model.layers.48.mlp.experts.45.gate_proj", "model.layers.48.mlp.experts.46.gate_proj", "model.layers.48.mlp.experts.47.gate_proj", "model.layers.48.mlp.experts.48.gate_proj", "model.layers.48.mlp.experts.49.gate_proj", "model.layers.48.mlp.experts.50.gate_proj", "model.layers.48.mlp.experts.51.gate_proj", "model.layers.48.mlp.experts.52.gate_proj", "model.layers.48.mlp.experts.53.gate_proj", "model.layers.48.mlp.experts.54.gate_proj", "model.layers.48.mlp.experts.55.gate_proj", "model.layers.48.mlp.experts.56.gate_proj", "model.layers.48.mlp.experts.57.gate_proj", "model.layers.48.mlp.experts.58.gate_proj", "model.layers.48.mlp.experts.59.gate_proj", "model.layers.48.mlp.experts.60.gate_proj", "model.layers.48.mlp.experts.61.gate_proj", "model.layers.48.mlp.experts.62.gate_proj", "model.layers.48.mlp.experts.63.gate_proj", "model.layers.48.mlp.experts.64.gate_proj", "model.layers.48.mlp.experts.65.gate_proj", "model.layers.48.mlp.experts.66.gate_proj", "model.layers.48.mlp.experts.67.gate_proj", "model.layers.48.mlp.experts.68.gate_proj", "model.layers.48.mlp.experts.69.gate_proj", "model.layers.48.mlp.experts.70.gate_proj", "model.layers.48.mlp.experts.71.gate_proj", "model.layers.48.mlp.experts.72.gate_proj", "model.layers.48.mlp.experts.73.gate_proj", "model.layers.48.mlp.experts.74.gate_proj", "model.layers.48.mlp.experts.75.gate_proj", "model.layers.48.mlp.experts.76.gate_proj", "model.layers.48.mlp.experts.77.gate_proj", "model.layers.48.mlp.experts.78.gate_proj", "model.layers.48.mlp.experts.79.gate_proj", "model.layers.48.mlp.experts.80.gate_proj", "model.layers.48.mlp.experts.81.gate_proj", "model.layers.48.mlp.experts.82.gate_proj", "model.layers.48.mlp.experts.83.gate_proj", "model.layers.48.mlp.experts.84.gate_proj", "model.layers.48.mlp.experts.85.gate_proj", "model.layers.48.mlp.experts.86.gate_proj", "model.layers.48.mlp.experts.87.gate_proj", "model.layers.48.mlp.experts.88.gate_proj", "model.layers.48.mlp.experts.89.gate_proj", "model.layers.48.mlp.experts.90.gate_proj", "model.layers.48.mlp.experts.91.gate_proj", "model.layers.48.mlp.experts.92.gate_proj", "model.layers.48.mlp.experts.93.gate_proj", "model.layers.48.mlp.experts.94.gate_proj", "model.layers.48.mlp.experts.95.gate_proj", "model.layers.48.mlp.experts.96.gate_proj", "model.layers.48.mlp.experts.97.gate_proj", "model.layers.48.mlp.experts.98.gate_proj", "model.layers.48.mlp.experts.99.gate_proj", "model.layers.48.mlp.experts.100.gate_proj", "model.layers.48.mlp.experts.101.gate_proj", "model.layers.48.mlp.experts.102.gate_proj", "model.layers.48.mlp.experts.103.gate_proj", "model.layers.48.mlp.experts.104.gate_proj", "model.layers.48.mlp.experts.105.gate_proj", "model.layers.48.mlp.experts.106.gate_proj", "model.layers.48.mlp.experts.107.gate_proj", "model.layers.48.mlp.experts.108.gate_proj", "model.layers.48.mlp.experts.109.gate_proj", "model.layers.48.mlp.experts.110.gate_proj", "model.layers.48.mlp.experts.111.gate_proj", "model.layers.48.mlp.experts.112.gate_proj", "model.layers.48.mlp.experts.113.gate_proj", "model.layers.48.mlp.experts.114.gate_proj", "model.layers.48.mlp.experts.115.gate_proj", "model.layers.48.mlp.experts.116.gate_proj", "model.layers.48.mlp.experts.117.gate_proj", "model.layers.48.mlp.experts.118.gate_proj", "model.layers.48.mlp.experts.119.gate_proj", "model.layers.48.mlp.experts.120.gate_proj", "model.layers.48.mlp.experts.121.gate_proj", "model.layers.48.mlp.experts.122.gate_proj", "model.layers.48.mlp.experts.123.gate_proj", "model.layers.48.mlp.experts.124.gate_proj", "model.layers.48.mlp.experts.125.gate_proj", "model.layers.48.mlp.experts.126.gate_proj", "model.layers.48.mlp.experts.127.gate_proj", "model.layers.48.mlp.experts.128.gate_proj", "model.layers.48.mlp.experts.129.gate_proj", "model.layers.48.mlp.experts.130.gate_proj", "model.layers.48.mlp.experts.131.gate_proj", "model.layers.48.mlp.experts.132.gate_proj", "model.layers.48.mlp.experts.133.gate_proj", "model.layers.48.mlp.experts.134.gate_proj", "model.layers.48.mlp.experts.135.gate_proj", "model.layers.48.mlp.experts.136.gate_proj", "model.layers.48.mlp.experts.137.gate_proj", "model.layers.48.mlp.experts.138.gate_proj", "model.layers.48.mlp.experts.139.gate_proj", "model.layers.48.mlp.experts.140.gate_proj", "model.layers.48.mlp.experts.141.gate_proj", "model.layers.48.mlp.experts.142.gate_proj", "model.layers.48.mlp.experts.143.gate_proj", "model.layers.48.mlp.experts.144.gate_proj", "model.layers.48.mlp.experts.145.gate_proj", "model.layers.48.mlp.experts.146.gate_proj", "model.layers.48.mlp.experts.147.gate_proj", "model.layers.48.mlp.experts.148.gate_proj", "model.layers.48.mlp.experts.149.gate_proj", "model.layers.48.mlp.experts.150.gate_proj", "model.layers.48.mlp.experts.151.gate_proj", "model.layers.48.mlp.experts.152.gate_proj", "model.layers.48.mlp.experts.153.gate_proj", "model.layers.48.mlp.experts.154.gate_proj", "model.layers.48.mlp.experts.155.gate_proj", "model.layers.48.mlp.experts.156.gate_proj", "model.layers.48.mlp.experts.157.gate_proj", "model.layers.48.mlp.experts.158.gate_proj", "model.layers.48.mlp.experts.159.gate_proj", "model.layers.48.mlp.experts.0.up_proj", "model.layers.48.mlp.experts.1.up_proj", "model.layers.48.mlp.experts.2.up_proj", "model.layers.48.mlp.experts.3.up_proj", "model.layers.48.mlp.experts.4.up_proj", "model.layers.48.mlp.experts.5.up_proj", "model.layers.48.mlp.experts.6.up_proj", "model.layers.48.mlp.experts.7.up_proj", "model.layers.48.mlp.experts.8.up_proj", "model.layers.48.mlp.experts.9.up_proj", "model.layers.48.mlp.experts.10.up_proj", "model.layers.48.mlp.experts.11.up_proj", "model.layers.48.mlp.experts.12.up_proj", "model.layers.48.mlp.experts.13.up_proj", "model.layers.48.mlp.experts.14.up_proj", "model.layers.48.mlp.experts.15.up_proj", "model.layers.48.mlp.experts.16.up_proj", "model.layers.48.mlp.experts.17.up_proj", "model.layers.48.mlp.experts.18.up_proj", "model.layers.48.mlp.experts.19.up_proj", "model.layers.48.mlp.experts.20.up_proj", "model.layers.48.mlp.experts.21.up_proj", "model.layers.48.mlp.experts.22.up_proj", "model.layers.48.mlp.experts.23.up_proj", "model.layers.48.mlp.experts.24.up_proj", "model.layers.48.mlp.experts.25.up_proj", "model.layers.48.mlp.experts.26.up_proj", "model.layers.48.mlp.experts.27.up_proj", "model.layers.48.mlp.experts.28.up_proj", "model.layers.48.mlp.experts.29.up_proj", "model.layers.48.mlp.experts.30.up_proj", "model.layers.48.mlp.experts.31.up_proj", "model.layers.48.mlp.experts.32.up_proj", "model.layers.48.mlp.experts.33.up_proj", "model.layers.48.mlp.experts.34.up_proj", "model.layers.48.mlp.experts.35.up_proj", "model.layers.48.mlp.experts.36.up_proj", "model.layers.48.mlp.experts.37.up_proj", "model.layers.48.mlp.experts.38.up_proj", "model.layers.48.mlp.experts.39.up_proj", "model.layers.48.mlp.experts.40.up_proj", "model.layers.48.mlp.experts.41.up_proj", "model.layers.48.mlp.experts.42.up_proj", "model.layers.48.mlp.experts.43.up_proj", "model.layers.48.mlp.experts.44.up_proj", "model.layers.48.mlp.experts.45.up_proj", "model.layers.48.mlp.experts.46.up_proj", "model.layers.48.mlp.experts.47.up_proj", "model.layers.48.mlp.experts.48.up_proj", "model.layers.48.mlp.experts.49.up_proj", "model.layers.48.mlp.experts.50.up_proj", "model.layers.48.mlp.experts.51.up_proj", "model.layers.48.mlp.experts.52.up_proj", "model.layers.48.mlp.experts.53.up_proj", "model.layers.48.mlp.experts.54.up_proj", "model.layers.48.mlp.experts.55.up_proj", "model.layers.48.mlp.experts.56.up_proj", "model.layers.48.mlp.experts.57.up_proj", "model.layers.48.mlp.experts.58.up_proj", "model.layers.48.mlp.experts.59.up_proj", "model.layers.48.mlp.experts.60.up_proj", "model.layers.48.mlp.experts.61.up_proj", "model.layers.48.mlp.experts.62.up_proj", "model.layers.48.mlp.experts.63.up_proj", "model.layers.48.mlp.experts.64.up_proj", "model.layers.48.mlp.experts.65.up_proj", "model.layers.48.mlp.experts.66.up_proj", "model.layers.48.mlp.experts.67.up_proj", "model.layers.48.mlp.experts.68.up_proj", "model.layers.48.mlp.experts.69.up_proj", "model.layers.48.mlp.experts.70.up_proj", "model.layers.48.mlp.experts.71.up_proj", "model.layers.48.mlp.experts.72.up_proj", "model.layers.48.mlp.experts.73.up_proj", "model.layers.48.mlp.experts.74.up_proj", "model.layers.48.mlp.experts.75.up_proj", "model.layers.48.mlp.experts.76.up_proj", "model.layers.48.mlp.experts.77.up_proj", "model.layers.48.mlp.experts.78.up_proj", "model.layers.48.mlp.experts.79.up_proj", "model.layers.48.mlp.experts.80.up_proj", "model.layers.48.mlp.experts.81.up_proj", "model.layers.48.mlp.experts.82.up_proj", "model.layers.48.mlp.experts.83.up_proj", "model.layers.48.mlp.experts.84.up_proj", "model.layers.48.mlp.experts.85.up_proj", "model.layers.48.mlp.experts.86.up_proj", "model.layers.48.mlp.experts.87.up_proj", "model.layers.48.mlp.experts.88.up_proj", "model.layers.48.mlp.experts.89.up_proj", "model.layers.48.mlp.experts.90.up_proj", "model.layers.48.mlp.experts.91.up_proj", "model.layers.48.mlp.experts.92.up_proj", "model.layers.48.mlp.experts.93.up_proj", "model.layers.48.mlp.experts.94.up_proj", "model.layers.48.mlp.experts.95.up_proj", "model.layers.48.mlp.experts.96.up_proj", "model.layers.48.mlp.experts.97.up_proj", "model.layers.48.mlp.experts.98.up_proj", "model.layers.48.mlp.experts.99.up_proj", "model.layers.48.mlp.experts.100.up_proj", "model.layers.48.mlp.experts.101.up_proj", "model.layers.48.mlp.experts.102.up_proj", "model.layers.48.mlp.experts.103.up_proj", "model.layers.48.mlp.experts.104.up_proj", "model.layers.48.mlp.experts.105.up_proj", "model.layers.48.mlp.experts.106.up_proj", "model.layers.48.mlp.experts.107.up_proj", "model.layers.48.mlp.experts.108.up_proj", "model.layers.48.mlp.experts.109.up_proj", "model.layers.48.mlp.experts.110.up_proj", "model.layers.48.mlp.experts.111.up_proj", "model.layers.48.mlp.experts.112.up_proj", "model.layers.48.mlp.experts.113.up_proj", "model.layers.48.mlp.experts.114.up_proj", "model.layers.48.mlp.experts.115.up_proj", "model.layers.48.mlp.experts.116.up_proj", "model.layers.48.mlp.experts.117.up_proj", "model.layers.48.mlp.experts.118.up_proj", "model.layers.48.mlp.experts.119.up_proj", "model.layers.48.mlp.experts.120.up_proj", "model.layers.48.mlp.experts.121.up_proj", "model.layers.48.mlp.experts.122.up_proj", "model.layers.48.mlp.experts.123.up_proj", "model.layers.48.mlp.experts.124.up_proj", "model.layers.48.mlp.experts.125.up_proj", "model.layers.48.mlp.experts.126.up_proj", "model.layers.48.mlp.experts.127.up_proj", "model.layers.48.mlp.experts.128.up_proj", "model.layers.48.mlp.experts.129.up_proj", "model.layers.48.mlp.experts.130.up_proj", "model.layers.48.mlp.experts.131.up_proj", "model.layers.48.mlp.experts.132.up_proj", "model.layers.48.mlp.experts.133.up_proj", "model.layers.48.mlp.experts.134.up_proj", "model.layers.48.mlp.experts.135.up_proj", "model.layers.48.mlp.experts.136.up_proj", "model.layers.48.mlp.experts.137.up_proj", "model.layers.48.mlp.experts.138.up_proj", "model.layers.48.mlp.experts.139.up_proj", "model.layers.48.mlp.experts.140.up_proj", "model.layers.48.mlp.experts.141.up_proj", "model.layers.48.mlp.experts.142.up_proj", "model.layers.48.mlp.experts.143.up_proj", "model.layers.48.mlp.experts.144.up_proj", "model.layers.48.mlp.experts.145.up_proj", "model.layers.48.mlp.experts.146.up_proj", "model.layers.48.mlp.experts.147.up_proj", "model.layers.48.mlp.experts.148.up_proj", "model.layers.48.mlp.experts.149.up_proj", "model.layers.48.mlp.experts.150.up_proj", "model.layers.48.mlp.experts.151.up_proj", "model.layers.48.mlp.experts.152.up_proj", "model.layers.48.mlp.experts.153.up_proj", "model.layers.48.mlp.experts.154.up_proj", "model.layers.48.mlp.experts.155.up_proj", "model.layers.48.mlp.experts.156.up_proj", "model.layers.48.mlp.experts.157.up_proj", "model.layers.48.mlp.experts.158.up_proj", "model.layers.48.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.3940175995231022e-05, "dbits": 2516582400 }, { "dkld": -9.22367908060516e-06, "dbits": 5033164800 } ] }, { "idx": 290, "layers": [ "model.layers.48.mlp.experts.0.down_proj", "model.layers.48.mlp.experts.1.down_proj", "model.layers.48.mlp.experts.2.down_proj", "model.layers.48.mlp.experts.3.down_proj", "model.layers.48.mlp.experts.4.down_proj", "model.layers.48.mlp.experts.5.down_proj", "model.layers.48.mlp.experts.6.down_proj", "model.layers.48.mlp.experts.7.down_proj", "model.layers.48.mlp.experts.8.down_proj", "model.layers.48.mlp.experts.9.down_proj", "model.layers.48.mlp.experts.10.down_proj", "model.layers.48.mlp.experts.11.down_proj", "model.layers.48.mlp.experts.12.down_proj", "model.layers.48.mlp.experts.13.down_proj", "model.layers.48.mlp.experts.14.down_proj", "model.layers.48.mlp.experts.15.down_proj", "model.layers.48.mlp.experts.16.down_proj", "model.layers.48.mlp.experts.17.down_proj", "model.layers.48.mlp.experts.18.down_proj", "model.layers.48.mlp.experts.19.down_proj", "model.layers.48.mlp.experts.20.down_proj", "model.layers.48.mlp.experts.21.down_proj", "model.layers.48.mlp.experts.22.down_proj", "model.layers.48.mlp.experts.23.down_proj", "model.layers.48.mlp.experts.24.down_proj", "model.layers.48.mlp.experts.25.down_proj", "model.layers.48.mlp.experts.26.down_proj", "model.layers.48.mlp.experts.27.down_proj", "model.layers.48.mlp.experts.28.down_proj", "model.layers.48.mlp.experts.29.down_proj", "model.layers.48.mlp.experts.30.down_proj", "model.layers.48.mlp.experts.31.down_proj", "model.layers.48.mlp.experts.32.down_proj", "model.layers.48.mlp.experts.33.down_proj", "model.layers.48.mlp.experts.34.down_proj", "model.layers.48.mlp.experts.35.down_proj", "model.layers.48.mlp.experts.36.down_proj", "model.layers.48.mlp.experts.37.down_proj", "model.layers.48.mlp.experts.38.down_proj", "model.layers.48.mlp.experts.39.down_proj", "model.layers.48.mlp.experts.40.down_proj", "model.layers.48.mlp.experts.41.down_proj", "model.layers.48.mlp.experts.42.down_proj", "model.layers.48.mlp.experts.43.down_proj", "model.layers.48.mlp.experts.44.down_proj", "model.layers.48.mlp.experts.45.down_proj", "model.layers.48.mlp.experts.46.down_proj", "model.layers.48.mlp.experts.47.down_proj", "model.layers.48.mlp.experts.48.down_proj", "model.layers.48.mlp.experts.49.down_proj", "model.layers.48.mlp.experts.50.down_proj", "model.layers.48.mlp.experts.51.down_proj", "model.layers.48.mlp.experts.52.down_proj", "model.layers.48.mlp.experts.53.down_proj", "model.layers.48.mlp.experts.54.down_proj", "model.layers.48.mlp.experts.55.down_proj", "model.layers.48.mlp.experts.56.down_proj", "model.layers.48.mlp.experts.57.down_proj", "model.layers.48.mlp.experts.58.down_proj", "model.layers.48.mlp.experts.59.down_proj", "model.layers.48.mlp.experts.60.down_proj", "model.layers.48.mlp.experts.61.down_proj", "model.layers.48.mlp.experts.62.down_proj", "model.layers.48.mlp.experts.63.down_proj", "model.layers.48.mlp.experts.64.down_proj", "model.layers.48.mlp.experts.65.down_proj", "model.layers.48.mlp.experts.66.down_proj", "model.layers.48.mlp.experts.67.down_proj", "model.layers.48.mlp.experts.68.down_proj", "model.layers.48.mlp.experts.69.down_proj", "model.layers.48.mlp.experts.70.down_proj", "model.layers.48.mlp.experts.71.down_proj", "model.layers.48.mlp.experts.72.down_proj", "model.layers.48.mlp.experts.73.down_proj", "model.layers.48.mlp.experts.74.down_proj", "model.layers.48.mlp.experts.75.down_proj", "model.layers.48.mlp.experts.76.down_proj", "model.layers.48.mlp.experts.77.down_proj", "model.layers.48.mlp.experts.78.down_proj", "model.layers.48.mlp.experts.79.down_proj", "model.layers.48.mlp.experts.80.down_proj", "model.layers.48.mlp.experts.81.down_proj", "model.layers.48.mlp.experts.82.down_proj", "model.layers.48.mlp.experts.83.down_proj", "model.layers.48.mlp.experts.84.down_proj", "model.layers.48.mlp.experts.85.down_proj", "model.layers.48.mlp.experts.86.down_proj", "model.layers.48.mlp.experts.87.down_proj", "model.layers.48.mlp.experts.88.down_proj", "model.layers.48.mlp.experts.89.down_proj", "model.layers.48.mlp.experts.90.down_proj", "model.layers.48.mlp.experts.91.down_proj", "model.layers.48.mlp.experts.92.down_proj", "model.layers.48.mlp.experts.93.down_proj", "model.layers.48.mlp.experts.94.down_proj", "model.layers.48.mlp.experts.95.down_proj", "model.layers.48.mlp.experts.96.down_proj", "model.layers.48.mlp.experts.97.down_proj", "model.layers.48.mlp.experts.98.down_proj", "model.layers.48.mlp.experts.99.down_proj", "model.layers.48.mlp.experts.100.down_proj", "model.layers.48.mlp.experts.101.down_proj", "model.layers.48.mlp.experts.102.down_proj", "model.layers.48.mlp.experts.103.down_proj", "model.layers.48.mlp.experts.104.down_proj", "model.layers.48.mlp.experts.105.down_proj", "model.layers.48.mlp.experts.106.down_proj", "model.layers.48.mlp.experts.107.down_proj", "model.layers.48.mlp.experts.108.down_proj", "model.layers.48.mlp.experts.109.down_proj", "model.layers.48.mlp.experts.110.down_proj", "model.layers.48.mlp.experts.111.down_proj", "model.layers.48.mlp.experts.112.down_proj", "model.layers.48.mlp.experts.113.down_proj", "model.layers.48.mlp.experts.114.down_proj", "model.layers.48.mlp.experts.115.down_proj", "model.layers.48.mlp.experts.116.down_proj", "model.layers.48.mlp.experts.117.down_proj", "model.layers.48.mlp.experts.118.down_proj", "model.layers.48.mlp.experts.119.down_proj", "model.layers.48.mlp.experts.120.down_proj", "model.layers.48.mlp.experts.121.down_proj", "model.layers.48.mlp.experts.122.down_proj", "model.layers.48.mlp.experts.123.down_proj", "model.layers.48.mlp.experts.124.down_proj", "model.layers.48.mlp.experts.125.down_proj", "model.layers.48.mlp.experts.126.down_proj", "model.layers.48.mlp.experts.127.down_proj", "model.layers.48.mlp.experts.128.down_proj", "model.layers.48.mlp.experts.129.down_proj", "model.layers.48.mlp.experts.130.down_proj", "model.layers.48.mlp.experts.131.down_proj", "model.layers.48.mlp.experts.132.down_proj", "model.layers.48.mlp.experts.133.down_proj", "model.layers.48.mlp.experts.134.down_proj", "model.layers.48.mlp.experts.135.down_proj", "model.layers.48.mlp.experts.136.down_proj", "model.layers.48.mlp.experts.137.down_proj", "model.layers.48.mlp.experts.138.down_proj", "model.layers.48.mlp.experts.139.down_proj", "model.layers.48.mlp.experts.140.down_proj", "model.layers.48.mlp.experts.141.down_proj", "model.layers.48.mlp.experts.142.down_proj", "model.layers.48.mlp.experts.143.down_proj", "model.layers.48.mlp.experts.144.down_proj", "model.layers.48.mlp.experts.145.down_proj", "model.layers.48.mlp.experts.146.down_proj", "model.layers.48.mlp.experts.147.down_proj", "model.layers.48.mlp.experts.148.down_proj", "model.layers.48.mlp.experts.149.down_proj", "model.layers.48.mlp.experts.150.down_proj", "model.layers.48.mlp.experts.151.down_proj", "model.layers.48.mlp.experts.152.down_proj", "model.layers.48.mlp.experts.153.down_proj", "model.layers.48.mlp.experts.154.down_proj", "model.layers.48.mlp.experts.155.down_proj", "model.layers.48.mlp.experts.156.down_proj", "model.layers.48.mlp.experts.157.down_proj", "model.layers.48.mlp.experts.158.down_proj", "model.layers.48.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.822009846568073e-05, "dbits": 1258291200 }, { "dkld": -1.0742526501416466e-05, "dbits": 2516582400 } ] }, { "idx": 291, "layers": [ "model.layers.49.self_attn.q_proj" ], "candidates": [ { "dkld": -4.721153527497204e-06, "dbits": 62914560 }, { "dkld": 1.912231091409991e-05, "dbits": 125829120 } ] }, { "idx": 292, "layers": [ "model.layers.49.self_attn.k_proj", "model.layers.49.self_attn.v_proj" ], "candidates": [ { "dkld": -6.633379962295294e-05, "dbits": 10485760 }, { "dkld": -6.940187886357238e-05, "dbits": 20971520 } ] }, { "idx": 293, "layers": [ "model.layers.49.self_attn.o_proj" ], "candidates": [ { "dkld": 2.85298097878698e-05, "dbits": 62914560 }, { "dkld": 3.957028966397082e-05, "dbits": 125829120 } ] }, { "idx": 294, "layers": [ "model.layers.49.mlp.shared_experts.gate_proj", "model.layers.49.mlp.shared_experts.up_proj", "model.layers.49.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.8919265605508587e-05, "dbits": 23592960 }, { "dkld": -8.720811456440491e-06, "dbits": 47185920 } ] }, { "idx": 295, "layers": [ "model.layers.49.mlp.experts.0.gate_proj", "model.layers.49.mlp.experts.1.gate_proj", "model.layers.49.mlp.experts.2.gate_proj", "model.layers.49.mlp.experts.3.gate_proj", "model.layers.49.mlp.experts.4.gate_proj", "model.layers.49.mlp.experts.5.gate_proj", "model.layers.49.mlp.experts.6.gate_proj", "model.layers.49.mlp.experts.7.gate_proj", "model.layers.49.mlp.experts.8.gate_proj", "model.layers.49.mlp.experts.9.gate_proj", "model.layers.49.mlp.experts.10.gate_proj", "model.layers.49.mlp.experts.11.gate_proj", "model.layers.49.mlp.experts.12.gate_proj", "model.layers.49.mlp.experts.13.gate_proj", "model.layers.49.mlp.experts.14.gate_proj", "model.layers.49.mlp.experts.15.gate_proj", "model.layers.49.mlp.experts.16.gate_proj", "model.layers.49.mlp.experts.17.gate_proj", "model.layers.49.mlp.experts.18.gate_proj", "model.layers.49.mlp.experts.19.gate_proj", "model.layers.49.mlp.experts.20.gate_proj", "model.layers.49.mlp.experts.21.gate_proj", "model.layers.49.mlp.experts.22.gate_proj", "model.layers.49.mlp.experts.23.gate_proj", "model.layers.49.mlp.experts.24.gate_proj", "model.layers.49.mlp.experts.25.gate_proj", "model.layers.49.mlp.experts.26.gate_proj", "model.layers.49.mlp.experts.27.gate_proj", "model.layers.49.mlp.experts.28.gate_proj", "model.layers.49.mlp.experts.29.gate_proj", "model.layers.49.mlp.experts.30.gate_proj", "model.layers.49.mlp.experts.31.gate_proj", "model.layers.49.mlp.experts.32.gate_proj", "model.layers.49.mlp.experts.33.gate_proj", "model.layers.49.mlp.experts.34.gate_proj", "model.layers.49.mlp.experts.35.gate_proj", "model.layers.49.mlp.experts.36.gate_proj", "model.layers.49.mlp.experts.37.gate_proj", "model.layers.49.mlp.experts.38.gate_proj", "model.layers.49.mlp.experts.39.gate_proj", "model.layers.49.mlp.experts.40.gate_proj", "model.layers.49.mlp.experts.41.gate_proj", "model.layers.49.mlp.experts.42.gate_proj", "model.layers.49.mlp.experts.43.gate_proj", "model.layers.49.mlp.experts.44.gate_proj", "model.layers.49.mlp.experts.45.gate_proj", "model.layers.49.mlp.experts.46.gate_proj", "model.layers.49.mlp.experts.47.gate_proj", "model.layers.49.mlp.experts.48.gate_proj", "model.layers.49.mlp.experts.49.gate_proj", "model.layers.49.mlp.experts.50.gate_proj", "model.layers.49.mlp.experts.51.gate_proj", "model.layers.49.mlp.experts.52.gate_proj", "model.layers.49.mlp.experts.53.gate_proj", "model.layers.49.mlp.experts.54.gate_proj", "model.layers.49.mlp.experts.55.gate_proj", "model.layers.49.mlp.experts.56.gate_proj", "model.layers.49.mlp.experts.57.gate_proj", "model.layers.49.mlp.experts.58.gate_proj", "model.layers.49.mlp.experts.59.gate_proj", "model.layers.49.mlp.experts.60.gate_proj", "model.layers.49.mlp.experts.61.gate_proj", "model.layers.49.mlp.experts.62.gate_proj", "model.layers.49.mlp.experts.63.gate_proj", "model.layers.49.mlp.experts.64.gate_proj", "model.layers.49.mlp.experts.65.gate_proj", "model.layers.49.mlp.experts.66.gate_proj", "model.layers.49.mlp.experts.67.gate_proj", "model.layers.49.mlp.experts.68.gate_proj", "model.layers.49.mlp.experts.69.gate_proj", "model.layers.49.mlp.experts.70.gate_proj", "model.layers.49.mlp.experts.71.gate_proj", "model.layers.49.mlp.experts.72.gate_proj", "model.layers.49.mlp.experts.73.gate_proj", "model.layers.49.mlp.experts.74.gate_proj", "model.layers.49.mlp.experts.75.gate_proj", "model.layers.49.mlp.experts.76.gate_proj", "model.layers.49.mlp.experts.77.gate_proj", "model.layers.49.mlp.experts.78.gate_proj", "model.layers.49.mlp.experts.79.gate_proj", "model.layers.49.mlp.experts.80.gate_proj", "model.layers.49.mlp.experts.81.gate_proj", "model.layers.49.mlp.experts.82.gate_proj", "model.layers.49.mlp.experts.83.gate_proj", "model.layers.49.mlp.experts.84.gate_proj", "model.layers.49.mlp.experts.85.gate_proj", "model.layers.49.mlp.experts.86.gate_proj", "model.layers.49.mlp.experts.87.gate_proj", "model.layers.49.mlp.experts.88.gate_proj", "model.layers.49.mlp.experts.89.gate_proj", "model.layers.49.mlp.experts.90.gate_proj", "model.layers.49.mlp.experts.91.gate_proj", "model.layers.49.mlp.experts.92.gate_proj", "model.layers.49.mlp.experts.93.gate_proj", "model.layers.49.mlp.experts.94.gate_proj", "model.layers.49.mlp.experts.95.gate_proj", "model.layers.49.mlp.experts.96.gate_proj", "model.layers.49.mlp.experts.97.gate_proj", "model.layers.49.mlp.experts.98.gate_proj", "model.layers.49.mlp.experts.99.gate_proj", "model.layers.49.mlp.experts.100.gate_proj", "model.layers.49.mlp.experts.101.gate_proj", "model.layers.49.mlp.experts.102.gate_proj", "model.layers.49.mlp.experts.103.gate_proj", "model.layers.49.mlp.experts.104.gate_proj", "model.layers.49.mlp.experts.105.gate_proj", "model.layers.49.mlp.experts.106.gate_proj", "model.layers.49.mlp.experts.107.gate_proj", "model.layers.49.mlp.experts.108.gate_proj", "model.layers.49.mlp.experts.109.gate_proj", "model.layers.49.mlp.experts.110.gate_proj", "model.layers.49.mlp.experts.111.gate_proj", "model.layers.49.mlp.experts.112.gate_proj", "model.layers.49.mlp.experts.113.gate_proj", "model.layers.49.mlp.experts.114.gate_proj", "model.layers.49.mlp.experts.115.gate_proj", "model.layers.49.mlp.experts.116.gate_proj", "model.layers.49.mlp.experts.117.gate_proj", "model.layers.49.mlp.experts.118.gate_proj", "model.layers.49.mlp.experts.119.gate_proj", "model.layers.49.mlp.experts.120.gate_proj", "model.layers.49.mlp.experts.121.gate_proj", "model.layers.49.mlp.experts.122.gate_proj", "model.layers.49.mlp.experts.123.gate_proj", "model.layers.49.mlp.experts.124.gate_proj", "model.layers.49.mlp.experts.125.gate_proj", "model.layers.49.mlp.experts.126.gate_proj", "model.layers.49.mlp.experts.127.gate_proj", "model.layers.49.mlp.experts.128.gate_proj", "model.layers.49.mlp.experts.129.gate_proj", "model.layers.49.mlp.experts.130.gate_proj", "model.layers.49.mlp.experts.131.gate_proj", "model.layers.49.mlp.experts.132.gate_proj", "model.layers.49.mlp.experts.133.gate_proj", "model.layers.49.mlp.experts.134.gate_proj", "model.layers.49.mlp.experts.135.gate_proj", "model.layers.49.mlp.experts.136.gate_proj", "model.layers.49.mlp.experts.137.gate_proj", "model.layers.49.mlp.experts.138.gate_proj", "model.layers.49.mlp.experts.139.gate_proj", "model.layers.49.mlp.experts.140.gate_proj", "model.layers.49.mlp.experts.141.gate_proj", "model.layers.49.mlp.experts.142.gate_proj", "model.layers.49.mlp.experts.143.gate_proj", "model.layers.49.mlp.experts.144.gate_proj", "model.layers.49.mlp.experts.145.gate_proj", "model.layers.49.mlp.experts.146.gate_proj", "model.layers.49.mlp.experts.147.gate_proj", "model.layers.49.mlp.experts.148.gate_proj", "model.layers.49.mlp.experts.149.gate_proj", "model.layers.49.mlp.experts.150.gate_proj", "model.layers.49.mlp.experts.151.gate_proj", "model.layers.49.mlp.experts.152.gate_proj", "model.layers.49.mlp.experts.153.gate_proj", "model.layers.49.mlp.experts.154.gate_proj", "model.layers.49.mlp.experts.155.gate_proj", "model.layers.49.mlp.experts.156.gate_proj", "model.layers.49.mlp.experts.157.gate_proj", "model.layers.49.mlp.experts.158.gate_proj", "model.layers.49.mlp.experts.159.gate_proj", "model.layers.49.mlp.experts.0.up_proj", "model.layers.49.mlp.experts.1.up_proj", "model.layers.49.mlp.experts.2.up_proj", "model.layers.49.mlp.experts.3.up_proj", "model.layers.49.mlp.experts.4.up_proj", "model.layers.49.mlp.experts.5.up_proj", "model.layers.49.mlp.experts.6.up_proj", "model.layers.49.mlp.experts.7.up_proj", "model.layers.49.mlp.experts.8.up_proj", "model.layers.49.mlp.experts.9.up_proj", "model.layers.49.mlp.experts.10.up_proj", "model.layers.49.mlp.experts.11.up_proj", "model.layers.49.mlp.experts.12.up_proj", "model.layers.49.mlp.experts.13.up_proj", "model.layers.49.mlp.experts.14.up_proj", "model.layers.49.mlp.experts.15.up_proj", "model.layers.49.mlp.experts.16.up_proj", "model.layers.49.mlp.experts.17.up_proj", "model.layers.49.mlp.experts.18.up_proj", "model.layers.49.mlp.experts.19.up_proj", "model.layers.49.mlp.experts.20.up_proj", "model.layers.49.mlp.experts.21.up_proj", "model.layers.49.mlp.experts.22.up_proj", "model.layers.49.mlp.experts.23.up_proj", "model.layers.49.mlp.experts.24.up_proj", "model.layers.49.mlp.experts.25.up_proj", "model.layers.49.mlp.experts.26.up_proj", "model.layers.49.mlp.experts.27.up_proj", "model.layers.49.mlp.experts.28.up_proj", "model.layers.49.mlp.experts.29.up_proj", "model.layers.49.mlp.experts.30.up_proj", "model.layers.49.mlp.experts.31.up_proj", "model.layers.49.mlp.experts.32.up_proj", "model.layers.49.mlp.experts.33.up_proj", "model.layers.49.mlp.experts.34.up_proj", "model.layers.49.mlp.experts.35.up_proj", "model.layers.49.mlp.experts.36.up_proj", "model.layers.49.mlp.experts.37.up_proj", "model.layers.49.mlp.experts.38.up_proj", "model.layers.49.mlp.experts.39.up_proj", "model.layers.49.mlp.experts.40.up_proj", "model.layers.49.mlp.experts.41.up_proj", "model.layers.49.mlp.experts.42.up_proj", "model.layers.49.mlp.experts.43.up_proj", "model.layers.49.mlp.experts.44.up_proj", "model.layers.49.mlp.experts.45.up_proj", "model.layers.49.mlp.experts.46.up_proj", "model.layers.49.mlp.experts.47.up_proj", "model.layers.49.mlp.experts.48.up_proj", "model.layers.49.mlp.experts.49.up_proj", "model.layers.49.mlp.experts.50.up_proj", "model.layers.49.mlp.experts.51.up_proj", "model.layers.49.mlp.experts.52.up_proj", "model.layers.49.mlp.experts.53.up_proj", "model.layers.49.mlp.experts.54.up_proj", "model.layers.49.mlp.experts.55.up_proj", "model.layers.49.mlp.experts.56.up_proj", "model.layers.49.mlp.experts.57.up_proj", "model.layers.49.mlp.experts.58.up_proj", "model.layers.49.mlp.experts.59.up_proj", "model.layers.49.mlp.experts.60.up_proj", "model.layers.49.mlp.experts.61.up_proj", "model.layers.49.mlp.experts.62.up_proj", "model.layers.49.mlp.experts.63.up_proj", "model.layers.49.mlp.experts.64.up_proj", "model.layers.49.mlp.experts.65.up_proj", "model.layers.49.mlp.experts.66.up_proj", "model.layers.49.mlp.experts.67.up_proj", "model.layers.49.mlp.experts.68.up_proj", "model.layers.49.mlp.experts.69.up_proj", "model.layers.49.mlp.experts.70.up_proj", "model.layers.49.mlp.experts.71.up_proj", "model.layers.49.mlp.experts.72.up_proj", "model.layers.49.mlp.experts.73.up_proj", "model.layers.49.mlp.experts.74.up_proj", "model.layers.49.mlp.experts.75.up_proj", "model.layers.49.mlp.experts.76.up_proj", "model.layers.49.mlp.experts.77.up_proj", "model.layers.49.mlp.experts.78.up_proj", "model.layers.49.mlp.experts.79.up_proj", "model.layers.49.mlp.experts.80.up_proj", "model.layers.49.mlp.experts.81.up_proj", "model.layers.49.mlp.experts.82.up_proj", "model.layers.49.mlp.experts.83.up_proj", "model.layers.49.mlp.experts.84.up_proj", "model.layers.49.mlp.experts.85.up_proj", "model.layers.49.mlp.experts.86.up_proj", "model.layers.49.mlp.experts.87.up_proj", "model.layers.49.mlp.experts.88.up_proj", "model.layers.49.mlp.experts.89.up_proj", "model.layers.49.mlp.experts.90.up_proj", "model.layers.49.mlp.experts.91.up_proj", "model.layers.49.mlp.experts.92.up_proj", "model.layers.49.mlp.experts.93.up_proj", "model.layers.49.mlp.experts.94.up_proj", "model.layers.49.mlp.experts.95.up_proj", "model.layers.49.mlp.experts.96.up_proj", "model.layers.49.mlp.experts.97.up_proj", "model.layers.49.mlp.experts.98.up_proj", "model.layers.49.mlp.experts.99.up_proj", "model.layers.49.mlp.experts.100.up_proj", "model.layers.49.mlp.experts.101.up_proj", "model.layers.49.mlp.experts.102.up_proj", "model.layers.49.mlp.experts.103.up_proj", "model.layers.49.mlp.experts.104.up_proj", "model.layers.49.mlp.experts.105.up_proj", "model.layers.49.mlp.experts.106.up_proj", "model.layers.49.mlp.experts.107.up_proj", "model.layers.49.mlp.experts.108.up_proj", "model.layers.49.mlp.experts.109.up_proj", "model.layers.49.mlp.experts.110.up_proj", "model.layers.49.mlp.experts.111.up_proj", "model.layers.49.mlp.experts.112.up_proj", "model.layers.49.mlp.experts.113.up_proj", "model.layers.49.mlp.experts.114.up_proj", "model.layers.49.mlp.experts.115.up_proj", "model.layers.49.mlp.experts.116.up_proj", "model.layers.49.mlp.experts.117.up_proj", "model.layers.49.mlp.experts.118.up_proj", "model.layers.49.mlp.experts.119.up_proj", "model.layers.49.mlp.experts.120.up_proj", "model.layers.49.mlp.experts.121.up_proj", "model.layers.49.mlp.experts.122.up_proj", "model.layers.49.mlp.experts.123.up_proj", "model.layers.49.mlp.experts.124.up_proj", "model.layers.49.mlp.experts.125.up_proj", "model.layers.49.mlp.experts.126.up_proj", "model.layers.49.mlp.experts.127.up_proj", "model.layers.49.mlp.experts.128.up_proj", "model.layers.49.mlp.experts.129.up_proj", "model.layers.49.mlp.experts.130.up_proj", "model.layers.49.mlp.experts.131.up_proj", "model.layers.49.mlp.experts.132.up_proj", "model.layers.49.mlp.experts.133.up_proj", "model.layers.49.mlp.experts.134.up_proj", "model.layers.49.mlp.experts.135.up_proj", "model.layers.49.mlp.experts.136.up_proj", "model.layers.49.mlp.experts.137.up_proj", "model.layers.49.mlp.experts.138.up_proj", "model.layers.49.mlp.experts.139.up_proj", "model.layers.49.mlp.experts.140.up_proj", "model.layers.49.mlp.experts.141.up_proj", "model.layers.49.mlp.experts.142.up_proj", "model.layers.49.mlp.experts.143.up_proj", "model.layers.49.mlp.experts.144.up_proj", "model.layers.49.mlp.experts.145.up_proj", "model.layers.49.mlp.experts.146.up_proj", "model.layers.49.mlp.experts.147.up_proj", "model.layers.49.mlp.experts.148.up_proj", "model.layers.49.mlp.experts.149.up_proj", "model.layers.49.mlp.experts.150.up_proj", "model.layers.49.mlp.experts.151.up_proj", "model.layers.49.mlp.experts.152.up_proj", "model.layers.49.mlp.experts.153.up_proj", "model.layers.49.mlp.experts.154.up_proj", "model.layers.49.mlp.experts.155.up_proj", "model.layers.49.mlp.experts.156.up_proj", "model.layers.49.mlp.experts.157.up_proj", "model.layers.49.mlp.experts.158.up_proj", "model.layers.49.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.3326842822133454e-05, "dbits": 2516582400 }, { "dkld": -1.1521391570568085e-05, "dbits": 5033164800 } ] }, { "idx": 296, "layers": [ "model.layers.49.mlp.experts.0.down_proj", "model.layers.49.mlp.experts.1.down_proj", "model.layers.49.mlp.experts.2.down_proj", "model.layers.49.mlp.experts.3.down_proj", "model.layers.49.mlp.experts.4.down_proj", "model.layers.49.mlp.experts.5.down_proj", "model.layers.49.mlp.experts.6.down_proj", "model.layers.49.mlp.experts.7.down_proj", "model.layers.49.mlp.experts.8.down_proj", "model.layers.49.mlp.experts.9.down_proj", "model.layers.49.mlp.experts.10.down_proj", "model.layers.49.mlp.experts.11.down_proj", "model.layers.49.mlp.experts.12.down_proj", "model.layers.49.mlp.experts.13.down_proj", "model.layers.49.mlp.experts.14.down_proj", "model.layers.49.mlp.experts.15.down_proj", "model.layers.49.mlp.experts.16.down_proj", "model.layers.49.mlp.experts.17.down_proj", "model.layers.49.mlp.experts.18.down_proj", "model.layers.49.mlp.experts.19.down_proj", "model.layers.49.mlp.experts.20.down_proj", "model.layers.49.mlp.experts.21.down_proj", "model.layers.49.mlp.experts.22.down_proj", "model.layers.49.mlp.experts.23.down_proj", "model.layers.49.mlp.experts.24.down_proj", "model.layers.49.mlp.experts.25.down_proj", "model.layers.49.mlp.experts.26.down_proj", "model.layers.49.mlp.experts.27.down_proj", "model.layers.49.mlp.experts.28.down_proj", "model.layers.49.mlp.experts.29.down_proj", "model.layers.49.mlp.experts.30.down_proj", "model.layers.49.mlp.experts.31.down_proj", "model.layers.49.mlp.experts.32.down_proj", "model.layers.49.mlp.experts.33.down_proj", "model.layers.49.mlp.experts.34.down_proj", "model.layers.49.mlp.experts.35.down_proj", "model.layers.49.mlp.experts.36.down_proj", "model.layers.49.mlp.experts.37.down_proj", "model.layers.49.mlp.experts.38.down_proj", "model.layers.49.mlp.experts.39.down_proj", "model.layers.49.mlp.experts.40.down_proj", "model.layers.49.mlp.experts.41.down_proj", "model.layers.49.mlp.experts.42.down_proj", "model.layers.49.mlp.experts.43.down_proj", "model.layers.49.mlp.experts.44.down_proj", "model.layers.49.mlp.experts.45.down_proj", "model.layers.49.mlp.experts.46.down_proj", "model.layers.49.mlp.experts.47.down_proj", "model.layers.49.mlp.experts.48.down_proj", "model.layers.49.mlp.experts.49.down_proj", "model.layers.49.mlp.experts.50.down_proj", "model.layers.49.mlp.experts.51.down_proj", "model.layers.49.mlp.experts.52.down_proj", "model.layers.49.mlp.experts.53.down_proj", "model.layers.49.mlp.experts.54.down_proj", "model.layers.49.mlp.experts.55.down_proj", "model.layers.49.mlp.experts.56.down_proj", "model.layers.49.mlp.experts.57.down_proj", "model.layers.49.mlp.experts.58.down_proj", "model.layers.49.mlp.experts.59.down_proj", "model.layers.49.mlp.experts.60.down_proj", "model.layers.49.mlp.experts.61.down_proj", "model.layers.49.mlp.experts.62.down_proj", "model.layers.49.mlp.experts.63.down_proj", "model.layers.49.mlp.experts.64.down_proj", "model.layers.49.mlp.experts.65.down_proj", "model.layers.49.mlp.experts.66.down_proj", "model.layers.49.mlp.experts.67.down_proj", "model.layers.49.mlp.experts.68.down_proj", "model.layers.49.mlp.experts.69.down_proj", "model.layers.49.mlp.experts.70.down_proj", "model.layers.49.mlp.experts.71.down_proj", "model.layers.49.mlp.experts.72.down_proj", "model.layers.49.mlp.experts.73.down_proj", "model.layers.49.mlp.experts.74.down_proj", "model.layers.49.mlp.experts.75.down_proj", "model.layers.49.mlp.experts.76.down_proj", "model.layers.49.mlp.experts.77.down_proj", "model.layers.49.mlp.experts.78.down_proj", "model.layers.49.mlp.experts.79.down_proj", "model.layers.49.mlp.experts.80.down_proj", "model.layers.49.mlp.experts.81.down_proj", "model.layers.49.mlp.experts.82.down_proj", "model.layers.49.mlp.experts.83.down_proj", "model.layers.49.mlp.experts.84.down_proj", "model.layers.49.mlp.experts.85.down_proj", "model.layers.49.mlp.experts.86.down_proj", "model.layers.49.mlp.experts.87.down_proj", "model.layers.49.mlp.experts.88.down_proj", "model.layers.49.mlp.experts.89.down_proj", "model.layers.49.mlp.experts.90.down_proj", "model.layers.49.mlp.experts.91.down_proj", "model.layers.49.mlp.experts.92.down_proj", "model.layers.49.mlp.experts.93.down_proj", "model.layers.49.mlp.experts.94.down_proj", "model.layers.49.mlp.experts.95.down_proj", "model.layers.49.mlp.experts.96.down_proj", "model.layers.49.mlp.experts.97.down_proj", "model.layers.49.mlp.experts.98.down_proj", "model.layers.49.mlp.experts.99.down_proj", "model.layers.49.mlp.experts.100.down_proj", "model.layers.49.mlp.experts.101.down_proj", "model.layers.49.mlp.experts.102.down_proj", "model.layers.49.mlp.experts.103.down_proj", "model.layers.49.mlp.experts.104.down_proj", "model.layers.49.mlp.experts.105.down_proj", "model.layers.49.mlp.experts.106.down_proj", "model.layers.49.mlp.experts.107.down_proj", "model.layers.49.mlp.experts.108.down_proj", "model.layers.49.mlp.experts.109.down_proj", "model.layers.49.mlp.experts.110.down_proj", "model.layers.49.mlp.experts.111.down_proj", "model.layers.49.mlp.experts.112.down_proj", "model.layers.49.mlp.experts.113.down_proj", "model.layers.49.mlp.experts.114.down_proj", "model.layers.49.mlp.experts.115.down_proj", "model.layers.49.mlp.experts.116.down_proj", "model.layers.49.mlp.experts.117.down_proj", "model.layers.49.mlp.experts.118.down_proj", "model.layers.49.mlp.experts.119.down_proj", "model.layers.49.mlp.experts.120.down_proj", "model.layers.49.mlp.experts.121.down_proj", "model.layers.49.mlp.experts.122.down_proj", "model.layers.49.mlp.experts.123.down_proj", "model.layers.49.mlp.experts.124.down_proj", "model.layers.49.mlp.experts.125.down_proj", "model.layers.49.mlp.experts.126.down_proj", "model.layers.49.mlp.experts.127.down_proj", "model.layers.49.mlp.experts.128.down_proj", "model.layers.49.mlp.experts.129.down_proj", "model.layers.49.mlp.experts.130.down_proj", "model.layers.49.mlp.experts.131.down_proj", "model.layers.49.mlp.experts.132.down_proj", "model.layers.49.mlp.experts.133.down_proj", "model.layers.49.mlp.experts.134.down_proj", "model.layers.49.mlp.experts.135.down_proj", "model.layers.49.mlp.experts.136.down_proj", "model.layers.49.mlp.experts.137.down_proj", "model.layers.49.mlp.experts.138.down_proj", "model.layers.49.mlp.experts.139.down_proj", "model.layers.49.mlp.experts.140.down_proj", "model.layers.49.mlp.experts.141.down_proj", "model.layers.49.mlp.experts.142.down_proj", "model.layers.49.mlp.experts.143.down_proj", "model.layers.49.mlp.experts.144.down_proj", "model.layers.49.mlp.experts.145.down_proj", "model.layers.49.mlp.experts.146.down_proj", "model.layers.49.mlp.experts.147.down_proj", "model.layers.49.mlp.experts.148.down_proj", "model.layers.49.mlp.experts.149.down_proj", "model.layers.49.mlp.experts.150.down_proj", "model.layers.49.mlp.experts.151.down_proj", "model.layers.49.mlp.experts.152.down_proj", "model.layers.49.mlp.experts.153.down_proj", "model.layers.49.mlp.experts.154.down_proj", "model.layers.49.mlp.experts.155.down_proj", "model.layers.49.mlp.experts.156.down_proj", "model.layers.49.mlp.experts.157.down_proj", "model.layers.49.mlp.experts.158.down_proj", "model.layers.49.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 3.4886645153171802e-06, "dbits": 1258291200 }, { "dkld": -3.5223551094528543e-06, "dbits": 2516582400 } ] }, { "idx": 297, "layers": [ "model.layers.50.self_attn.q_proj" ], "candidates": [ { "dkld": 1.8688850104808807e-05, "dbits": 62914560 }, { "dkld": 1.7657852731646495e-05, "dbits": 125829120 } ] }, { "idx": 298, "layers": [ "model.layers.50.self_attn.k_proj", "model.layers.50.self_attn.v_proj" ], "candidates": [ { "dkld": -6.895128171890974e-05, "dbits": 10485760 }, { "dkld": -9.969330858439207e-05, "dbits": 20971520 } ] }, { "idx": 299, "layers": [ "model.layers.50.self_attn.o_proj" ], "candidates": [ { "dkld": -4.489959683269193e-05, "dbits": 62914560 }, { "dkld": -3.113090060651198e-05, "dbits": 125829120 } ] }, { "idx": 300, "layers": [ "model.layers.50.mlp.shared_experts.gate_proj", "model.layers.50.mlp.shared_experts.up_proj", "model.layers.50.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.341362949460606e-05, "dbits": 23592960 }, { "dkld": -2.953084185719143e-06, "dbits": 47185920 } ] }, { "idx": 301, "layers": [ "model.layers.50.mlp.experts.0.gate_proj", "model.layers.50.mlp.experts.1.gate_proj", "model.layers.50.mlp.experts.2.gate_proj", "model.layers.50.mlp.experts.3.gate_proj", "model.layers.50.mlp.experts.4.gate_proj", "model.layers.50.mlp.experts.5.gate_proj", "model.layers.50.mlp.experts.6.gate_proj", "model.layers.50.mlp.experts.7.gate_proj", "model.layers.50.mlp.experts.8.gate_proj", "model.layers.50.mlp.experts.9.gate_proj", "model.layers.50.mlp.experts.10.gate_proj", "model.layers.50.mlp.experts.11.gate_proj", "model.layers.50.mlp.experts.12.gate_proj", "model.layers.50.mlp.experts.13.gate_proj", "model.layers.50.mlp.experts.14.gate_proj", "model.layers.50.mlp.experts.15.gate_proj", "model.layers.50.mlp.experts.16.gate_proj", "model.layers.50.mlp.experts.17.gate_proj", "model.layers.50.mlp.experts.18.gate_proj", "model.layers.50.mlp.experts.19.gate_proj", "model.layers.50.mlp.experts.20.gate_proj", "model.layers.50.mlp.experts.21.gate_proj", "model.layers.50.mlp.experts.22.gate_proj", "model.layers.50.mlp.experts.23.gate_proj", "model.layers.50.mlp.experts.24.gate_proj", "model.layers.50.mlp.experts.25.gate_proj", "model.layers.50.mlp.experts.26.gate_proj", "model.layers.50.mlp.experts.27.gate_proj", "model.layers.50.mlp.experts.28.gate_proj", "model.layers.50.mlp.experts.29.gate_proj", "model.layers.50.mlp.experts.30.gate_proj", "model.layers.50.mlp.experts.31.gate_proj", "model.layers.50.mlp.experts.32.gate_proj", "model.layers.50.mlp.experts.33.gate_proj", "model.layers.50.mlp.experts.34.gate_proj", "model.layers.50.mlp.experts.35.gate_proj", "model.layers.50.mlp.experts.36.gate_proj", "model.layers.50.mlp.experts.37.gate_proj", "model.layers.50.mlp.experts.38.gate_proj", "model.layers.50.mlp.experts.39.gate_proj", "model.layers.50.mlp.experts.40.gate_proj", "model.layers.50.mlp.experts.41.gate_proj", "model.layers.50.mlp.experts.42.gate_proj", "model.layers.50.mlp.experts.43.gate_proj", "model.layers.50.mlp.experts.44.gate_proj", "model.layers.50.mlp.experts.45.gate_proj", "model.layers.50.mlp.experts.46.gate_proj", "model.layers.50.mlp.experts.47.gate_proj", "model.layers.50.mlp.experts.48.gate_proj", "model.layers.50.mlp.experts.49.gate_proj", "model.layers.50.mlp.experts.50.gate_proj", "model.layers.50.mlp.experts.51.gate_proj", "model.layers.50.mlp.experts.52.gate_proj", "model.layers.50.mlp.experts.53.gate_proj", "model.layers.50.mlp.experts.54.gate_proj", "model.layers.50.mlp.experts.55.gate_proj", "model.layers.50.mlp.experts.56.gate_proj", "model.layers.50.mlp.experts.57.gate_proj", "model.layers.50.mlp.experts.58.gate_proj", "model.layers.50.mlp.experts.59.gate_proj", "model.layers.50.mlp.experts.60.gate_proj", "model.layers.50.mlp.experts.61.gate_proj", "model.layers.50.mlp.experts.62.gate_proj", "model.layers.50.mlp.experts.63.gate_proj", "model.layers.50.mlp.experts.64.gate_proj", "model.layers.50.mlp.experts.65.gate_proj", "model.layers.50.mlp.experts.66.gate_proj", "model.layers.50.mlp.experts.67.gate_proj", "model.layers.50.mlp.experts.68.gate_proj", "model.layers.50.mlp.experts.69.gate_proj", "model.layers.50.mlp.experts.70.gate_proj", "model.layers.50.mlp.experts.71.gate_proj", "model.layers.50.mlp.experts.72.gate_proj", "model.layers.50.mlp.experts.73.gate_proj", "model.layers.50.mlp.experts.74.gate_proj", "model.layers.50.mlp.experts.75.gate_proj", "model.layers.50.mlp.experts.76.gate_proj", "model.layers.50.mlp.experts.77.gate_proj", "model.layers.50.mlp.experts.78.gate_proj", "model.layers.50.mlp.experts.79.gate_proj", "model.layers.50.mlp.experts.80.gate_proj", "model.layers.50.mlp.experts.81.gate_proj", "model.layers.50.mlp.experts.82.gate_proj", "model.layers.50.mlp.experts.83.gate_proj", "model.layers.50.mlp.experts.84.gate_proj", "model.layers.50.mlp.experts.85.gate_proj", "model.layers.50.mlp.experts.86.gate_proj", "model.layers.50.mlp.experts.87.gate_proj", "model.layers.50.mlp.experts.88.gate_proj", "model.layers.50.mlp.experts.89.gate_proj", "model.layers.50.mlp.experts.90.gate_proj", "model.layers.50.mlp.experts.91.gate_proj", "model.layers.50.mlp.experts.92.gate_proj", "model.layers.50.mlp.experts.93.gate_proj", "model.layers.50.mlp.experts.94.gate_proj", "model.layers.50.mlp.experts.95.gate_proj", "model.layers.50.mlp.experts.96.gate_proj", "model.layers.50.mlp.experts.97.gate_proj", "model.layers.50.mlp.experts.98.gate_proj", "model.layers.50.mlp.experts.99.gate_proj", "model.layers.50.mlp.experts.100.gate_proj", "model.layers.50.mlp.experts.101.gate_proj", "model.layers.50.mlp.experts.102.gate_proj", "model.layers.50.mlp.experts.103.gate_proj", "model.layers.50.mlp.experts.104.gate_proj", "model.layers.50.mlp.experts.105.gate_proj", "model.layers.50.mlp.experts.106.gate_proj", "model.layers.50.mlp.experts.107.gate_proj", "model.layers.50.mlp.experts.108.gate_proj", "model.layers.50.mlp.experts.109.gate_proj", "model.layers.50.mlp.experts.110.gate_proj", "model.layers.50.mlp.experts.111.gate_proj", "model.layers.50.mlp.experts.112.gate_proj", "model.layers.50.mlp.experts.113.gate_proj", "model.layers.50.mlp.experts.114.gate_proj", "model.layers.50.mlp.experts.115.gate_proj", "model.layers.50.mlp.experts.116.gate_proj", "model.layers.50.mlp.experts.117.gate_proj", "model.layers.50.mlp.experts.118.gate_proj", "model.layers.50.mlp.experts.119.gate_proj", "model.layers.50.mlp.experts.120.gate_proj", "model.layers.50.mlp.experts.121.gate_proj", "model.layers.50.mlp.experts.122.gate_proj", "model.layers.50.mlp.experts.123.gate_proj", "model.layers.50.mlp.experts.124.gate_proj", "model.layers.50.mlp.experts.125.gate_proj", "model.layers.50.mlp.experts.126.gate_proj", "model.layers.50.mlp.experts.127.gate_proj", "model.layers.50.mlp.experts.128.gate_proj", "model.layers.50.mlp.experts.129.gate_proj", "model.layers.50.mlp.experts.130.gate_proj", "model.layers.50.mlp.experts.131.gate_proj", "model.layers.50.mlp.experts.132.gate_proj", "model.layers.50.mlp.experts.133.gate_proj", "model.layers.50.mlp.experts.134.gate_proj", "model.layers.50.mlp.experts.135.gate_proj", "model.layers.50.mlp.experts.136.gate_proj", "model.layers.50.mlp.experts.137.gate_proj", "model.layers.50.mlp.experts.138.gate_proj", "model.layers.50.mlp.experts.139.gate_proj", "model.layers.50.mlp.experts.140.gate_proj", "model.layers.50.mlp.experts.141.gate_proj", "model.layers.50.mlp.experts.142.gate_proj", "model.layers.50.mlp.experts.143.gate_proj", "model.layers.50.mlp.experts.144.gate_proj", "model.layers.50.mlp.experts.145.gate_proj", "model.layers.50.mlp.experts.146.gate_proj", "model.layers.50.mlp.experts.147.gate_proj", "model.layers.50.mlp.experts.148.gate_proj", "model.layers.50.mlp.experts.149.gate_proj", "model.layers.50.mlp.experts.150.gate_proj", "model.layers.50.mlp.experts.151.gate_proj", "model.layers.50.mlp.experts.152.gate_proj", "model.layers.50.mlp.experts.153.gate_proj", "model.layers.50.mlp.experts.154.gate_proj", "model.layers.50.mlp.experts.155.gate_proj", "model.layers.50.mlp.experts.156.gate_proj", "model.layers.50.mlp.experts.157.gate_proj", "model.layers.50.mlp.experts.158.gate_proj", "model.layers.50.mlp.experts.159.gate_proj", "model.layers.50.mlp.experts.0.up_proj", "model.layers.50.mlp.experts.1.up_proj", "model.layers.50.mlp.experts.2.up_proj", "model.layers.50.mlp.experts.3.up_proj", "model.layers.50.mlp.experts.4.up_proj", "model.layers.50.mlp.experts.5.up_proj", "model.layers.50.mlp.experts.6.up_proj", "model.layers.50.mlp.experts.7.up_proj", "model.layers.50.mlp.experts.8.up_proj", "model.layers.50.mlp.experts.9.up_proj", "model.layers.50.mlp.experts.10.up_proj", "model.layers.50.mlp.experts.11.up_proj", "model.layers.50.mlp.experts.12.up_proj", "model.layers.50.mlp.experts.13.up_proj", "model.layers.50.mlp.experts.14.up_proj", "model.layers.50.mlp.experts.15.up_proj", "model.layers.50.mlp.experts.16.up_proj", "model.layers.50.mlp.experts.17.up_proj", "model.layers.50.mlp.experts.18.up_proj", "model.layers.50.mlp.experts.19.up_proj", "model.layers.50.mlp.experts.20.up_proj", "model.layers.50.mlp.experts.21.up_proj", "model.layers.50.mlp.experts.22.up_proj", "model.layers.50.mlp.experts.23.up_proj", "model.layers.50.mlp.experts.24.up_proj", "model.layers.50.mlp.experts.25.up_proj", "model.layers.50.mlp.experts.26.up_proj", "model.layers.50.mlp.experts.27.up_proj", "model.layers.50.mlp.experts.28.up_proj", "model.layers.50.mlp.experts.29.up_proj", "model.layers.50.mlp.experts.30.up_proj", "model.layers.50.mlp.experts.31.up_proj", "model.layers.50.mlp.experts.32.up_proj", "model.layers.50.mlp.experts.33.up_proj", "model.layers.50.mlp.experts.34.up_proj", "model.layers.50.mlp.experts.35.up_proj", "model.layers.50.mlp.experts.36.up_proj", "model.layers.50.mlp.experts.37.up_proj", "model.layers.50.mlp.experts.38.up_proj", "model.layers.50.mlp.experts.39.up_proj", "model.layers.50.mlp.experts.40.up_proj", "model.layers.50.mlp.experts.41.up_proj", "model.layers.50.mlp.experts.42.up_proj", "model.layers.50.mlp.experts.43.up_proj", "model.layers.50.mlp.experts.44.up_proj", "model.layers.50.mlp.experts.45.up_proj", "model.layers.50.mlp.experts.46.up_proj", "model.layers.50.mlp.experts.47.up_proj", "model.layers.50.mlp.experts.48.up_proj", "model.layers.50.mlp.experts.49.up_proj", "model.layers.50.mlp.experts.50.up_proj", "model.layers.50.mlp.experts.51.up_proj", "model.layers.50.mlp.experts.52.up_proj", "model.layers.50.mlp.experts.53.up_proj", "model.layers.50.mlp.experts.54.up_proj", "model.layers.50.mlp.experts.55.up_proj", "model.layers.50.mlp.experts.56.up_proj", "model.layers.50.mlp.experts.57.up_proj", "model.layers.50.mlp.experts.58.up_proj", "model.layers.50.mlp.experts.59.up_proj", "model.layers.50.mlp.experts.60.up_proj", "model.layers.50.mlp.experts.61.up_proj", "model.layers.50.mlp.experts.62.up_proj", "model.layers.50.mlp.experts.63.up_proj", "model.layers.50.mlp.experts.64.up_proj", "model.layers.50.mlp.experts.65.up_proj", "model.layers.50.mlp.experts.66.up_proj", "model.layers.50.mlp.experts.67.up_proj", "model.layers.50.mlp.experts.68.up_proj", "model.layers.50.mlp.experts.69.up_proj", "model.layers.50.mlp.experts.70.up_proj", "model.layers.50.mlp.experts.71.up_proj", "model.layers.50.mlp.experts.72.up_proj", "model.layers.50.mlp.experts.73.up_proj", "model.layers.50.mlp.experts.74.up_proj", "model.layers.50.mlp.experts.75.up_proj", "model.layers.50.mlp.experts.76.up_proj", "model.layers.50.mlp.experts.77.up_proj", "model.layers.50.mlp.experts.78.up_proj", "model.layers.50.mlp.experts.79.up_proj", "model.layers.50.mlp.experts.80.up_proj", "model.layers.50.mlp.experts.81.up_proj", "model.layers.50.mlp.experts.82.up_proj", "model.layers.50.mlp.experts.83.up_proj", "model.layers.50.mlp.experts.84.up_proj", "model.layers.50.mlp.experts.85.up_proj", "model.layers.50.mlp.experts.86.up_proj", "model.layers.50.mlp.experts.87.up_proj", "model.layers.50.mlp.experts.88.up_proj", "model.layers.50.mlp.experts.89.up_proj", "model.layers.50.mlp.experts.90.up_proj", "model.layers.50.mlp.experts.91.up_proj", "model.layers.50.mlp.experts.92.up_proj", "model.layers.50.mlp.experts.93.up_proj", "model.layers.50.mlp.experts.94.up_proj", "model.layers.50.mlp.experts.95.up_proj", "model.layers.50.mlp.experts.96.up_proj", "model.layers.50.mlp.experts.97.up_proj", "model.layers.50.mlp.experts.98.up_proj", "model.layers.50.mlp.experts.99.up_proj", "model.layers.50.mlp.experts.100.up_proj", "model.layers.50.mlp.experts.101.up_proj", "model.layers.50.mlp.experts.102.up_proj", "model.layers.50.mlp.experts.103.up_proj", "model.layers.50.mlp.experts.104.up_proj", "model.layers.50.mlp.experts.105.up_proj", "model.layers.50.mlp.experts.106.up_proj", "model.layers.50.mlp.experts.107.up_proj", "model.layers.50.mlp.experts.108.up_proj", "model.layers.50.mlp.experts.109.up_proj", "model.layers.50.mlp.experts.110.up_proj", "model.layers.50.mlp.experts.111.up_proj", "model.layers.50.mlp.experts.112.up_proj", "model.layers.50.mlp.experts.113.up_proj", "model.layers.50.mlp.experts.114.up_proj", "model.layers.50.mlp.experts.115.up_proj", "model.layers.50.mlp.experts.116.up_proj", "model.layers.50.mlp.experts.117.up_proj", "model.layers.50.mlp.experts.118.up_proj", "model.layers.50.mlp.experts.119.up_proj", "model.layers.50.mlp.experts.120.up_proj", "model.layers.50.mlp.experts.121.up_proj", "model.layers.50.mlp.experts.122.up_proj", "model.layers.50.mlp.experts.123.up_proj", "model.layers.50.mlp.experts.124.up_proj", "model.layers.50.mlp.experts.125.up_proj", "model.layers.50.mlp.experts.126.up_proj", "model.layers.50.mlp.experts.127.up_proj", "model.layers.50.mlp.experts.128.up_proj", "model.layers.50.mlp.experts.129.up_proj", "model.layers.50.mlp.experts.130.up_proj", "model.layers.50.mlp.experts.131.up_proj", "model.layers.50.mlp.experts.132.up_proj", "model.layers.50.mlp.experts.133.up_proj", "model.layers.50.mlp.experts.134.up_proj", "model.layers.50.mlp.experts.135.up_proj", "model.layers.50.mlp.experts.136.up_proj", "model.layers.50.mlp.experts.137.up_proj", "model.layers.50.mlp.experts.138.up_proj", "model.layers.50.mlp.experts.139.up_proj", "model.layers.50.mlp.experts.140.up_proj", "model.layers.50.mlp.experts.141.up_proj", "model.layers.50.mlp.experts.142.up_proj", "model.layers.50.mlp.experts.143.up_proj", "model.layers.50.mlp.experts.144.up_proj", "model.layers.50.mlp.experts.145.up_proj", "model.layers.50.mlp.experts.146.up_proj", "model.layers.50.mlp.experts.147.up_proj", "model.layers.50.mlp.experts.148.up_proj", "model.layers.50.mlp.experts.149.up_proj", "model.layers.50.mlp.experts.150.up_proj", "model.layers.50.mlp.experts.151.up_proj", "model.layers.50.mlp.experts.152.up_proj", "model.layers.50.mlp.experts.153.up_proj", "model.layers.50.mlp.experts.154.up_proj", "model.layers.50.mlp.experts.155.up_proj", "model.layers.50.mlp.experts.156.up_proj", "model.layers.50.mlp.experts.157.up_proj", "model.layers.50.mlp.experts.158.up_proj", "model.layers.50.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.136958159506321e-05, "dbits": 2516582400 }, { "dkld": -3.748205490410224e-05, "dbits": 5033164800 } ] }, { "idx": 302, "layers": [ "model.layers.50.mlp.experts.0.down_proj", "model.layers.50.mlp.experts.1.down_proj", "model.layers.50.mlp.experts.2.down_proj", "model.layers.50.mlp.experts.3.down_proj", "model.layers.50.mlp.experts.4.down_proj", "model.layers.50.mlp.experts.5.down_proj", "model.layers.50.mlp.experts.6.down_proj", "model.layers.50.mlp.experts.7.down_proj", "model.layers.50.mlp.experts.8.down_proj", "model.layers.50.mlp.experts.9.down_proj", "model.layers.50.mlp.experts.10.down_proj", "model.layers.50.mlp.experts.11.down_proj", "model.layers.50.mlp.experts.12.down_proj", "model.layers.50.mlp.experts.13.down_proj", "model.layers.50.mlp.experts.14.down_proj", "model.layers.50.mlp.experts.15.down_proj", "model.layers.50.mlp.experts.16.down_proj", "model.layers.50.mlp.experts.17.down_proj", "model.layers.50.mlp.experts.18.down_proj", "model.layers.50.mlp.experts.19.down_proj", "model.layers.50.mlp.experts.20.down_proj", "model.layers.50.mlp.experts.21.down_proj", "model.layers.50.mlp.experts.22.down_proj", "model.layers.50.mlp.experts.23.down_proj", "model.layers.50.mlp.experts.24.down_proj", "model.layers.50.mlp.experts.25.down_proj", "model.layers.50.mlp.experts.26.down_proj", "model.layers.50.mlp.experts.27.down_proj", "model.layers.50.mlp.experts.28.down_proj", "model.layers.50.mlp.experts.29.down_proj", "model.layers.50.mlp.experts.30.down_proj", "model.layers.50.mlp.experts.31.down_proj", "model.layers.50.mlp.experts.32.down_proj", "model.layers.50.mlp.experts.33.down_proj", "model.layers.50.mlp.experts.34.down_proj", "model.layers.50.mlp.experts.35.down_proj", "model.layers.50.mlp.experts.36.down_proj", "model.layers.50.mlp.experts.37.down_proj", "model.layers.50.mlp.experts.38.down_proj", "model.layers.50.mlp.experts.39.down_proj", "model.layers.50.mlp.experts.40.down_proj", "model.layers.50.mlp.experts.41.down_proj", "model.layers.50.mlp.experts.42.down_proj", "model.layers.50.mlp.experts.43.down_proj", "model.layers.50.mlp.experts.44.down_proj", "model.layers.50.mlp.experts.45.down_proj", "model.layers.50.mlp.experts.46.down_proj", "model.layers.50.mlp.experts.47.down_proj", "model.layers.50.mlp.experts.48.down_proj", "model.layers.50.mlp.experts.49.down_proj", "model.layers.50.mlp.experts.50.down_proj", "model.layers.50.mlp.experts.51.down_proj", "model.layers.50.mlp.experts.52.down_proj", "model.layers.50.mlp.experts.53.down_proj", "model.layers.50.mlp.experts.54.down_proj", "model.layers.50.mlp.experts.55.down_proj", "model.layers.50.mlp.experts.56.down_proj", "model.layers.50.mlp.experts.57.down_proj", "model.layers.50.mlp.experts.58.down_proj", "model.layers.50.mlp.experts.59.down_proj", "model.layers.50.mlp.experts.60.down_proj", "model.layers.50.mlp.experts.61.down_proj", "model.layers.50.mlp.experts.62.down_proj", "model.layers.50.mlp.experts.63.down_proj", "model.layers.50.mlp.experts.64.down_proj", "model.layers.50.mlp.experts.65.down_proj", "model.layers.50.mlp.experts.66.down_proj", "model.layers.50.mlp.experts.67.down_proj", "model.layers.50.mlp.experts.68.down_proj", "model.layers.50.mlp.experts.69.down_proj", "model.layers.50.mlp.experts.70.down_proj", "model.layers.50.mlp.experts.71.down_proj", "model.layers.50.mlp.experts.72.down_proj", "model.layers.50.mlp.experts.73.down_proj", "model.layers.50.mlp.experts.74.down_proj", "model.layers.50.mlp.experts.75.down_proj", "model.layers.50.mlp.experts.76.down_proj", "model.layers.50.mlp.experts.77.down_proj", "model.layers.50.mlp.experts.78.down_proj", "model.layers.50.mlp.experts.79.down_proj", "model.layers.50.mlp.experts.80.down_proj", "model.layers.50.mlp.experts.81.down_proj", "model.layers.50.mlp.experts.82.down_proj", "model.layers.50.mlp.experts.83.down_proj", "model.layers.50.mlp.experts.84.down_proj", "model.layers.50.mlp.experts.85.down_proj", "model.layers.50.mlp.experts.86.down_proj", "model.layers.50.mlp.experts.87.down_proj", "model.layers.50.mlp.experts.88.down_proj", "model.layers.50.mlp.experts.89.down_proj", "model.layers.50.mlp.experts.90.down_proj", "model.layers.50.mlp.experts.91.down_proj", "model.layers.50.mlp.experts.92.down_proj", "model.layers.50.mlp.experts.93.down_proj", "model.layers.50.mlp.experts.94.down_proj", "model.layers.50.mlp.experts.95.down_proj", "model.layers.50.mlp.experts.96.down_proj", "model.layers.50.mlp.experts.97.down_proj", "model.layers.50.mlp.experts.98.down_proj", "model.layers.50.mlp.experts.99.down_proj", "model.layers.50.mlp.experts.100.down_proj", "model.layers.50.mlp.experts.101.down_proj", "model.layers.50.mlp.experts.102.down_proj", "model.layers.50.mlp.experts.103.down_proj", "model.layers.50.mlp.experts.104.down_proj", "model.layers.50.mlp.experts.105.down_proj", "model.layers.50.mlp.experts.106.down_proj", "model.layers.50.mlp.experts.107.down_proj", "model.layers.50.mlp.experts.108.down_proj", "model.layers.50.mlp.experts.109.down_proj", "model.layers.50.mlp.experts.110.down_proj", "model.layers.50.mlp.experts.111.down_proj", "model.layers.50.mlp.experts.112.down_proj", "model.layers.50.mlp.experts.113.down_proj", "model.layers.50.mlp.experts.114.down_proj", "model.layers.50.mlp.experts.115.down_proj", "model.layers.50.mlp.experts.116.down_proj", "model.layers.50.mlp.experts.117.down_proj", "model.layers.50.mlp.experts.118.down_proj", "model.layers.50.mlp.experts.119.down_proj", "model.layers.50.mlp.experts.120.down_proj", "model.layers.50.mlp.experts.121.down_proj", "model.layers.50.mlp.experts.122.down_proj", "model.layers.50.mlp.experts.123.down_proj", "model.layers.50.mlp.experts.124.down_proj", "model.layers.50.mlp.experts.125.down_proj", "model.layers.50.mlp.experts.126.down_proj", "model.layers.50.mlp.experts.127.down_proj", "model.layers.50.mlp.experts.128.down_proj", "model.layers.50.mlp.experts.129.down_proj", "model.layers.50.mlp.experts.130.down_proj", "model.layers.50.mlp.experts.131.down_proj", "model.layers.50.mlp.experts.132.down_proj", "model.layers.50.mlp.experts.133.down_proj", "model.layers.50.mlp.experts.134.down_proj", "model.layers.50.mlp.experts.135.down_proj", "model.layers.50.mlp.experts.136.down_proj", "model.layers.50.mlp.experts.137.down_proj", "model.layers.50.mlp.experts.138.down_proj", "model.layers.50.mlp.experts.139.down_proj", "model.layers.50.mlp.experts.140.down_proj", "model.layers.50.mlp.experts.141.down_proj", "model.layers.50.mlp.experts.142.down_proj", "model.layers.50.mlp.experts.143.down_proj", "model.layers.50.mlp.experts.144.down_proj", "model.layers.50.mlp.experts.145.down_proj", "model.layers.50.mlp.experts.146.down_proj", "model.layers.50.mlp.experts.147.down_proj", "model.layers.50.mlp.experts.148.down_proj", "model.layers.50.mlp.experts.149.down_proj", "model.layers.50.mlp.experts.150.down_proj", "model.layers.50.mlp.experts.151.down_proj", "model.layers.50.mlp.experts.152.down_proj", "model.layers.50.mlp.experts.153.down_proj", "model.layers.50.mlp.experts.154.down_proj", "model.layers.50.mlp.experts.155.down_proj", "model.layers.50.mlp.experts.156.down_proj", "model.layers.50.mlp.experts.157.down_proj", "model.layers.50.mlp.experts.158.down_proj", "model.layers.50.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 9.771180339158969e-06, "dbits": 1258291200 }, { "dkld": -4.954217001794728e-06, "dbits": 2516582400 } ] }, { "idx": 303, "layers": [ "model.layers.51.self_attn.q_proj" ], "candidates": [ { "dkld": -3.214250318704648e-06, "dbits": 62914560 }, { "dkld": 1.092453021556139e-05, "dbits": 125829120 } ] }, { "idx": 304, "layers": [ "model.layers.51.self_attn.k_proj", "model.layers.51.self_attn.v_proj" ], "candidates": [ { "dkld": -1.5653320588171482e-05, "dbits": 10485760 }, { "dkld": -5.991628859192133e-05, "dbits": 20971520 } ] }, { "idx": 305, "layers": [ "model.layers.51.self_attn.o_proj" ], "candidates": [ { "dkld": 6.211025174707174e-05, "dbits": 62914560 }, { "dkld": 5.432788748294115e-05, "dbits": 125829120 } ] }, { "idx": 306, "layers": [ "model.layers.51.mlp.shared_experts.gate_proj", "model.layers.51.mlp.shared_experts.up_proj", "model.layers.51.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.9083703197538506e-05, "dbits": 23592960 }, { "dkld": -3.604218363761902e-05, "dbits": 47185920 } ] }, { "idx": 307, "layers": [ "model.layers.51.mlp.experts.0.gate_proj", "model.layers.51.mlp.experts.1.gate_proj", "model.layers.51.mlp.experts.2.gate_proj", "model.layers.51.mlp.experts.3.gate_proj", "model.layers.51.mlp.experts.4.gate_proj", "model.layers.51.mlp.experts.5.gate_proj", "model.layers.51.mlp.experts.6.gate_proj", "model.layers.51.mlp.experts.7.gate_proj", "model.layers.51.mlp.experts.8.gate_proj", "model.layers.51.mlp.experts.9.gate_proj", "model.layers.51.mlp.experts.10.gate_proj", "model.layers.51.mlp.experts.11.gate_proj", "model.layers.51.mlp.experts.12.gate_proj", "model.layers.51.mlp.experts.13.gate_proj", "model.layers.51.mlp.experts.14.gate_proj", "model.layers.51.mlp.experts.15.gate_proj", "model.layers.51.mlp.experts.16.gate_proj", "model.layers.51.mlp.experts.17.gate_proj", "model.layers.51.mlp.experts.18.gate_proj", "model.layers.51.mlp.experts.19.gate_proj", "model.layers.51.mlp.experts.20.gate_proj", "model.layers.51.mlp.experts.21.gate_proj", "model.layers.51.mlp.experts.22.gate_proj", "model.layers.51.mlp.experts.23.gate_proj", "model.layers.51.mlp.experts.24.gate_proj", "model.layers.51.mlp.experts.25.gate_proj", "model.layers.51.mlp.experts.26.gate_proj", "model.layers.51.mlp.experts.27.gate_proj", "model.layers.51.mlp.experts.28.gate_proj", "model.layers.51.mlp.experts.29.gate_proj", "model.layers.51.mlp.experts.30.gate_proj", "model.layers.51.mlp.experts.31.gate_proj", "model.layers.51.mlp.experts.32.gate_proj", "model.layers.51.mlp.experts.33.gate_proj", "model.layers.51.mlp.experts.34.gate_proj", "model.layers.51.mlp.experts.35.gate_proj", "model.layers.51.mlp.experts.36.gate_proj", "model.layers.51.mlp.experts.37.gate_proj", "model.layers.51.mlp.experts.38.gate_proj", "model.layers.51.mlp.experts.39.gate_proj", "model.layers.51.mlp.experts.40.gate_proj", "model.layers.51.mlp.experts.41.gate_proj", "model.layers.51.mlp.experts.42.gate_proj", "model.layers.51.mlp.experts.43.gate_proj", "model.layers.51.mlp.experts.44.gate_proj", "model.layers.51.mlp.experts.45.gate_proj", "model.layers.51.mlp.experts.46.gate_proj", "model.layers.51.mlp.experts.47.gate_proj", "model.layers.51.mlp.experts.48.gate_proj", "model.layers.51.mlp.experts.49.gate_proj", "model.layers.51.mlp.experts.50.gate_proj", "model.layers.51.mlp.experts.51.gate_proj", "model.layers.51.mlp.experts.52.gate_proj", "model.layers.51.mlp.experts.53.gate_proj", "model.layers.51.mlp.experts.54.gate_proj", "model.layers.51.mlp.experts.55.gate_proj", "model.layers.51.mlp.experts.56.gate_proj", "model.layers.51.mlp.experts.57.gate_proj", "model.layers.51.mlp.experts.58.gate_proj", "model.layers.51.mlp.experts.59.gate_proj", "model.layers.51.mlp.experts.60.gate_proj", "model.layers.51.mlp.experts.61.gate_proj", "model.layers.51.mlp.experts.62.gate_proj", "model.layers.51.mlp.experts.63.gate_proj", "model.layers.51.mlp.experts.64.gate_proj", "model.layers.51.mlp.experts.65.gate_proj", "model.layers.51.mlp.experts.66.gate_proj", "model.layers.51.mlp.experts.67.gate_proj", "model.layers.51.mlp.experts.68.gate_proj", "model.layers.51.mlp.experts.69.gate_proj", "model.layers.51.mlp.experts.70.gate_proj", "model.layers.51.mlp.experts.71.gate_proj", "model.layers.51.mlp.experts.72.gate_proj", "model.layers.51.mlp.experts.73.gate_proj", "model.layers.51.mlp.experts.74.gate_proj", "model.layers.51.mlp.experts.75.gate_proj", "model.layers.51.mlp.experts.76.gate_proj", "model.layers.51.mlp.experts.77.gate_proj", "model.layers.51.mlp.experts.78.gate_proj", "model.layers.51.mlp.experts.79.gate_proj", "model.layers.51.mlp.experts.80.gate_proj", "model.layers.51.mlp.experts.81.gate_proj", "model.layers.51.mlp.experts.82.gate_proj", "model.layers.51.mlp.experts.83.gate_proj", "model.layers.51.mlp.experts.84.gate_proj", "model.layers.51.mlp.experts.85.gate_proj", "model.layers.51.mlp.experts.86.gate_proj", "model.layers.51.mlp.experts.87.gate_proj", "model.layers.51.mlp.experts.88.gate_proj", "model.layers.51.mlp.experts.89.gate_proj", "model.layers.51.mlp.experts.90.gate_proj", "model.layers.51.mlp.experts.91.gate_proj", "model.layers.51.mlp.experts.92.gate_proj", "model.layers.51.mlp.experts.93.gate_proj", "model.layers.51.mlp.experts.94.gate_proj", "model.layers.51.mlp.experts.95.gate_proj", "model.layers.51.mlp.experts.96.gate_proj", "model.layers.51.mlp.experts.97.gate_proj", "model.layers.51.mlp.experts.98.gate_proj", "model.layers.51.mlp.experts.99.gate_proj", "model.layers.51.mlp.experts.100.gate_proj", "model.layers.51.mlp.experts.101.gate_proj", "model.layers.51.mlp.experts.102.gate_proj", "model.layers.51.mlp.experts.103.gate_proj", "model.layers.51.mlp.experts.104.gate_proj", "model.layers.51.mlp.experts.105.gate_proj", "model.layers.51.mlp.experts.106.gate_proj", "model.layers.51.mlp.experts.107.gate_proj", "model.layers.51.mlp.experts.108.gate_proj", "model.layers.51.mlp.experts.109.gate_proj", "model.layers.51.mlp.experts.110.gate_proj", "model.layers.51.mlp.experts.111.gate_proj", "model.layers.51.mlp.experts.112.gate_proj", "model.layers.51.mlp.experts.113.gate_proj", "model.layers.51.mlp.experts.114.gate_proj", "model.layers.51.mlp.experts.115.gate_proj", "model.layers.51.mlp.experts.116.gate_proj", "model.layers.51.mlp.experts.117.gate_proj", "model.layers.51.mlp.experts.118.gate_proj", "model.layers.51.mlp.experts.119.gate_proj", "model.layers.51.mlp.experts.120.gate_proj", "model.layers.51.mlp.experts.121.gate_proj", "model.layers.51.mlp.experts.122.gate_proj", "model.layers.51.mlp.experts.123.gate_proj", "model.layers.51.mlp.experts.124.gate_proj", "model.layers.51.mlp.experts.125.gate_proj", "model.layers.51.mlp.experts.126.gate_proj", "model.layers.51.mlp.experts.127.gate_proj", "model.layers.51.mlp.experts.128.gate_proj", "model.layers.51.mlp.experts.129.gate_proj", "model.layers.51.mlp.experts.130.gate_proj", "model.layers.51.mlp.experts.131.gate_proj", "model.layers.51.mlp.experts.132.gate_proj", "model.layers.51.mlp.experts.133.gate_proj", "model.layers.51.mlp.experts.134.gate_proj", "model.layers.51.mlp.experts.135.gate_proj", "model.layers.51.mlp.experts.136.gate_proj", "model.layers.51.mlp.experts.137.gate_proj", "model.layers.51.mlp.experts.138.gate_proj", "model.layers.51.mlp.experts.139.gate_proj", "model.layers.51.mlp.experts.140.gate_proj", "model.layers.51.mlp.experts.141.gate_proj", "model.layers.51.mlp.experts.142.gate_proj", "model.layers.51.mlp.experts.143.gate_proj", "model.layers.51.mlp.experts.144.gate_proj", "model.layers.51.mlp.experts.145.gate_proj", "model.layers.51.mlp.experts.146.gate_proj", "model.layers.51.mlp.experts.147.gate_proj", "model.layers.51.mlp.experts.148.gate_proj", "model.layers.51.mlp.experts.149.gate_proj", "model.layers.51.mlp.experts.150.gate_proj", "model.layers.51.mlp.experts.151.gate_proj", "model.layers.51.mlp.experts.152.gate_proj", "model.layers.51.mlp.experts.153.gate_proj", "model.layers.51.mlp.experts.154.gate_proj", "model.layers.51.mlp.experts.155.gate_proj", "model.layers.51.mlp.experts.156.gate_proj", "model.layers.51.mlp.experts.157.gate_proj", "model.layers.51.mlp.experts.158.gate_proj", "model.layers.51.mlp.experts.159.gate_proj", "model.layers.51.mlp.experts.0.up_proj", "model.layers.51.mlp.experts.1.up_proj", "model.layers.51.mlp.experts.2.up_proj", "model.layers.51.mlp.experts.3.up_proj", "model.layers.51.mlp.experts.4.up_proj", "model.layers.51.mlp.experts.5.up_proj", "model.layers.51.mlp.experts.6.up_proj", "model.layers.51.mlp.experts.7.up_proj", "model.layers.51.mlp.experts.8.up_proj", "model.layers.51.mlp.experts.9.up_proj", "model.layers.51.mlp.experts.10.up_proj", "model.layers.51.mlp.experts.11.up_proj", "model.layers.51.mlp.experts.12.up_proj", "model.layers.51.mlp.experts.13.up_proj", "model.layers.51.mlp.experts.14.up_proj", "model.layers.51.mlp.experts.15.up_proj", "model.layers.51.mlp.experts.16.up_proj", "model.layers.51.mlp.experts.17.up_proj", "model.layers.51.mlp.experts.18.up_proj", "model.layers.51.mlp.experts.19.up_proj", "model.layers.51.mlp.experts.20.up_proj", "model.layers.51.mlp.experts.21.up_proj", "model.layers.51.mlp.experts.22.up_proj", "model.layers.51.mlp.experts.23.up_proj", "model.layers.51.mlp.experts.24.up_proj", "model.layers.51.mlp.experts.25.up_proj", "model.layers.51.mlp.experts.26.up_proj", "model.layers.51.mlp.experts.27.up_proj", "model.layers.51.mlp.experts.28.up_proj", "model.layers.51.mlp.experts.29.up_proj", "model.layers.51.mlp.experts.30.up_proj", "model.layers.51.mlp.experts.31.up_proj", "model.layers.51.mlp.experts.32.up_proj", "model.layers.51.mlp.experts.33.up_proj", "model.layers.51.mlp.experts.34.up_proj", "model.layers.51.mlp.experts.35.up_proj", "model.layers.51.mlp.experts.36.up_proj", "model.layers.51.mlp.experts.37.up_proj", "model.layers.51.mlp.experts.38.up_proj", "model.layers.51.mlp.experts.39.up_proj", "model.layers.51.mlp.experts.40.up_proj", "model.layers.51.mlp.experts.41.up_proj", "model.layers.51.mlp.experts.42.up_proj", "model.layers.51.mlp.experts.43.up_proj", "model.layers.51.mlp.experts.44.up_proj", "model.layers.51.mlp.experts.45.up_proj", "model.layers.51.mlp.experts.46.up_proj", "model.layers.51.mlp.experts.47.up_proj", "model.layers.51.mlp.experts.48.up_proj", "model.layers.51.mlp.experts.49.up_proj", "model.layers.51.mlp.experts.50.up_proj", "model.layers.51.mlp.experts.51.up_proj", "model.layers.51.mlp.experts.52.up_proj", "model.layers.51.mlp.experts.53.up_proj", "model.layers.51.mlp.experts.54.up_proj", "model.layers.51.mlp.experts.55.up_proj", "model.layers.51.mlp.experts.56.up_proj", "model.layers.51.mlp.experts.57.up_proj", "model.layers.51.mlp.experts.58.up_proj", "model.layers.51.mlp.experts.59.up_proj", "model.layers.51.mlp.experts.60.up_proj", "model.layers.51.mlp.experts.61.up_proj", "model.layers.51.mlp.experts.62.up_proj", "model.layers.51.mlp.experts.63.up_proj", "model.layers.51.mlp.experts.64.up_proj", "model.layers.51.mlp.experts.65.up_proj", "model.layers.51.mlp.experts.66.up_proj", "model.layers.51.mlp.experts.67.up_proj", "model.layers.51.mlp.experts.68.up_proj", "model.layers.51.mlp.experts.69.up_proj", "model.layers.51.mlp.experts.70.up_proj", "model.layers.51.mlp.experts.71.up_proj", "model.layers.51.mlp.experts.72.up_proj", "model.layers.51.mlp.experts.73.up_proj", "model.layers.51.mlp.experts.74.up_proj", "model.layers.51.mlp.experts.75.up_proj", "model.layers.51.mlp.experts.76.up_proj", "model.layers.51.mlp.experts.77.up_proj", "model.layers.51.mlp.experts.78.up_proj", "model.layers.51.mlp.experts.79.up_proj", "model.layers.51.mlp.experts.80.up_proj", "model.layers.51.mlp.experts.81.up_proj", "model.layers.51.mlp.experts.82.up_proj", "model.layers.51.mlp.experts.83.up_proj", "model.layers.51.mlp.experts.84.up_proj", "model.layers.51.mlp.experts.85.up_proj", "model.layers.51.mlp.experts.86.up_proj", "model.layers.51.mlp.experts.87.up_proj", "model.layers.51.mlp.experts.88.up_proj", "model.layers.51.mlp.experts.89.up_proj", "model.layers.51.mlp.experts.90.up_proj", "model.layers.51.mlp.experts.91.up_proj", "model.layers.51.mlp.experts.92.up_proj", "model.layers.51.mlp.experts.93.up_proj", "model.layers.51.mlp.experts.94.up_proj", "model.layers.51.mlp.experts.95.up_proj", "model.layers.51.mlp.experts.96.up_proj", "model.layers.51.mlp.experts.97.up_proj", "model.layers.51.mlp.experts.98.up_proj", "model.layers.51.mlp.experts.99.up_proj", "model.layers.51.mlp.experts.100.up_proj", "model.layers.51.mlp.experts.101.up_proj", "model.layers.51.mlp.experts.102.up_proj", "model.layers.51.mlp.experts.103.up_proj", "model.layers.51.mlp.experts.104.up_proj", "model.layers.51.mlp.experts.105.up_proj", "model.layers.51.mlp.experts.106.up_proj", "model.layers.51.mlp.experts.107.up_proj", "model.layers.51.mlp.experts.108.up_proj", "model.layers.51.mlp.experts.109.up_proj", "model.layers.51.mlp.experts.110.up_proj", "model.layers.51.mlp.experts.111.up_proj", "model.layers.51.mlp.experts.112.up_proj", "model.layers.51.mlp.experts.113.up_proj", "model.layers.51.mlp.experts.114.up_proj", "model.layers.51.mlp.experts.115.up_proj", "model.layers.51.mlp.experts.116.up_proj", "model.layers.51.mlp.experts.117.up_proj", "model.layers.51.mlp.experts.118.up_proj", "model.layers.51.mlp.experts.119.up_proj", "model.layers.51.mlp.experts.120.up_proj", "model.layers.51.mlp.experts.121.up_proj", "model.layers.51.mlp.experts.122.up_proj", "model.layers.51.mlp.experts.123.up_proj", "model.layers.51.mlp.experts.124.up_proj", "model.layers.51.mlp.experts.125.up_proj", "model.layers.51.mlp.experts.126.up_proj", "model.layers.51.mlp.experts.127.up_proj", "model.layers.51.mlp.experts.128.up_proj", "model.layers.51.mlp.experts.129.up_proj", "model.layers.51.mlp.experts.130.up_proj", "model.layers.51.mlp.experts.131.up_proj", "model.layers.51.mlp.experts.132.up_proj", "model.layers.51.mlp.experts.133.up_proj", "model.layers.51.mlp.experts.134.up_proj", "model.layers.51.mlp.experts.135.up_proj", "model.layers.51.mlp.experts.136.up_proj", "model.layers.51.mlp.experts.137.up_proj", "model.layers.51.mlp.experts.138.up_proj", "model.layers.51.mlp.experts.139.up_proj", "model.layers.51.mlp.experts.140.up_proj", "model.layers.51.mlp.experts.141.up_proj", "model.layers.51.mlp.experts.142.up_proj", "model.layers.51.mlp.experts.143.up_proj", "model.layers.51.mlp.experts.144.up_proj", "model.layers.51.mlp.experts.145.up_proj", "model.layers.51.mlp.experts.146.up_proj", "model.layers.51.mlp.experts.147.up_proj", "model.layers.51.mlp.experts.148.up_proj", "model.layers.51.mlp.experts.149.up_proj", "model.layers.51.mlp.experts.150.up_proj", "model.layers.51.mlp.experts.151.up_proj", "model.layers.51.mlp.experts.152.up_proj", "model.layers.51.mlp.experts.153.up_proj", "model.layers.51.mlp.experts.154.up_proj", "model.layers.51.mlp.experts.155.up_proj", "model.layers.51.mlp.experts.156.up_proj", "model.layers.51.mlp.experts.157.up_proj", "model.layers.51.mlp.experts.158.up_proj", "model.layers.51.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.283005207777023e-05, "dbits": 2516582400 }, { "dkld": -3.912434913217952e-05, "dbits": 5033164800 } ] }, { "idx": 308, "layers": [ "model.layers.51.mlp.experts.0.down_proj", "model.layers.51.mlp.experts.1.down_proj", "model.layers.51.mlp.experts.2.down_proj", "model.layers.51.mlp.experts.3.down_proj", "model.layers.51.mlp.experts.4.down_proj", "model.layers.51.mlp.experts.5.down_proj", "model.layers.51.mlp.experts.6.down_proj", "model.layers.51.mlp.experts.7.down_proj", "model.layers.51.mlp.experts.8.down_proj", "model.layers.51.mlp.experts.9.down_proj", "model.layers.51.mlp.experts.10.down_proj", "model.layers.51.mlp.experts.11.down_proj", "model.layers.51.mlp.experts.12.down_proj", "model.layers.51.mlp.experts.13.down_proj", "model.layers.51.mlp.experts.14.down_proj", "model.layers.51.mlp.experts.15.down_proj", "model.layers.51.mlp.experts.16.down_proj", "model.layers.51.mlp.experts.17.down_proj", "model.layers.51.mlp.experts.18.down_proj", "model.layers.51.mlp.experts.19.down_proj", "model.layers.51.mlp.experts.20.down_proj", "model.layers.51.mlp.experts.21.down_proj", "model.layers.51.mlp.experts.22.down_proj", "model.layers.51.mlp.experts.23.down_proj", "model.layers.51.mlp.experts.24.down_proj", "model.layers.51.mlp.experts.25.down_proj", "model.layers.51.mlp.experts.26.down_proj", "model.layers.51.mlp.experts.27.down_proj", "model.layers.51.mlp.experts.28.down_proj", "model.layers.51.mlp.experts.29.down_proj", "model.layers.51.mlp.experts.30.down_proj", "model.layers.51.mlp.experts.31.down_proj", "model.layers.51.mlp.experts.32.down_proj", "model.layers.51.mlp.experts.33.down_proj", "model.layers.51.mlp.experts.34.down_proj", "model.layers.51.mlp.experts.35.down_proj", "model.layers.51.mlp.experts.36.down_proj", "model.layers.51.mlp.experts.37.down_proj", "model.layers.51.mlp.experts.38.down_proj", "model.layers.51.mlp.experts.39.down_proj", "model.layers.51.mlp.experts.40.down_proj", "model.layers.51.mlp.experts.41.down_proj", "model.layers.51.mlp.experts.42.down_proj", "model.layers.51.mlp.experts.43.down_proj", "model.layers.51.mlp.experts.44.down_proj", "model.layers.51.mlp.experts.45.down_proj", "model.layers.51.mlp.experts.46.down_proj", "model.layers.51.mlp.experts.47.down_proj", "model.layers.51.mlp.experts.48.down_proj", "model.layers.51.mlp.experts.49.down_proj", "model.layers.51.mlp.experts.50.down_proj", "model.layers.51.mlp.experts.51.down_proj", "model.layers.51.mlp.experts.52.down_proj", "model.layers.51.mlp.experts.53.down_proj", "model.layers.51.mlp.experts.54.down_proj", "model.layers.51.mlp.experts.55.down_proj", "model.layers.51.mlp.experts.56.down_proj", "model.layers.51.mlp.experts.57.down_proj", "model.layers.51.mlp.experts.58.down_proj", "model.layers.51.mlp.experts.59.down_proj", "model.layers.51.mlp.experts.60.down_proj", "model.layers.51.mlp.experts.61.down_proj", "model.layers.51.mlp.experts.62.down_proj", "model.layers.51.mlp.experts.63.down_proj", "model.layers.51.mlp.experts.64.down_proj", "model.layers.51.mlp.experts.65.down_proj", "model.layers.51.mlp.experts.66.down_proj", "model.layers.51.mlp.experts.67.down_proj", "model.layers.51.mlp.experts.68.down_proj", "model.layers.51.mlp.experts.69.down_proj", "model.layers.51.mlp.experts.70.down_proj", "model.layers.51.mlp.experts.71.down_proj", "model.layers.51.mlp.experts.72.down_proj", "model.layers.51.mlp.experts.73.down_proj", "model.layers.51.mlp.experts.74.down_proj", "model.layers.51.mlp.experts.75.down_proj", "model.layers.51.mlp.experts.76.down_proj", "model.layers.51.mlp.experts.77.down_proj", "model.layers.51.mlp.experts.78.down_proj", "model.layers.51.mlp.experts.79.down_proj", "model.layers.51.mlp.experts.80.down_proj", "model.layers.51.mlp.experts.81.down_proj", "model.layers.51.mlp.experts.82.down_proj", "model.layers.51.mlp.experts.83.down_proj", "model.layers.51.mlp.experts.84.down_proj", "model.layers.51.mlp.experts.85.down_proj", "model.layers.51.mlp.experts.86.down_proj", "model.layers.51.mlp.experts.87.down_proj", "model.layers.51.mlp.experts.88.down_proj", "model.layers.51.mlp.experts.89.down_proj", "model.layers.51.mlp.experts.90.down_proj", "model.layers.51.mlp.experts.91.down_proj", "model.layers.51.mlp.experts.92.down_proj", "model.layers.51.mlp.experts.93.down_proj", "model.layers.51.mlp.experts.94.down_proj", "model.layers.51.mlp.experts.95.down_proj", "model.layers.51.mlp.experts.96.down_proj", "model.layers.51.mlp.experts.97.down_proj", "model.layers.51.mlp.experts.98.down_proj", "model.layers.51.mlp.experts.99.down_proj", "model.layers.51.mlp.experts.100.down_proj", "model.layers.51.mlp.experts.101.down_proj", "model.layers.51.mlp.experts.102.down_proj", "model.layers.51.mlp.experts.103.down_proj", "model.layers.51.mlp.experts.104.down_proj", "model.layers.51.mlp.experts.105.down_proj", "model.layers.51.mlp.experts.106.down_proj", "model.layers.51.mlp.experts.107.down_proj", "model.layers.51.mlp.experts.108.down_proj", "model.layers.51.mlp.experts.109.down_proj", "model.layers.51.mlp.experts.110.down_proj", "model.layers.51.mlp.experts.111.down_proj", "model.layers.51.mlp.experts.112.down_proj", "model.layers.51.mlp.experts.113.down_proj", "model.layers.51.mlp.experts.114.down_proj", "model.layers.51.mlp.experts.115.down_proj", "model.layers.51.mlp.experts.116.down_proj", "model.layers.51.mlp.experts.117.down_proj", "model.layers.51.mlp.experts.118.down_proj", "model.layers.51.mlp.experts.119.down_proj", "model.layers.51.mlp.experts.120.down_proj", "model.layers.51.mlp.experts.121.down_proj", "model.layers.51.mlp.experts.122.down_proj", "model.layers.51.mlp.experts.123.down_proj", "model.layers.51.mlp.experts.124.down_proj", "model.layers.51.mlp.experts.125.down_proj", "model.layers.51.mlp.experts.126.down_proj", "model.layers.51.mlp.experts.127.down_proj", "model.layers.51.mlp.experts.128.down_proj", "model.layers.51.mlp.experts.129.down_proj", "model.layers.51.mlp.experts.130.down_proj", "model.layers.51.mlp.experts.131.down_proj", "model.layers.51.mlp.experts.132.down_proj", "model.layers.51.mlp.experts.133.down_proj", "model.layers.51.mlp.experts.134.down_proj", "model.layers.51.mlp.experts.135.down_proj", "model.layers.51.mlp.experts.136.down_proj", "model.layers.51.mlp.experts.137.down_proj", "model.layers.51.mlp.experts.138.down_proj", "model.layers.51.mlp.experts.139.down_proj", "model.layers.51.mlp.experts.140.down_proj", "model.layers.51.mlp.experts.141.down_proj", "model.layers.51.mlp.experts.142.down_proj", "model.layers.51.mlp.experts.143.down_proj", "model.layers.51.mlp.experts.144.down_proj", "model.layers.51.mlp.experts.145.down_proj", "model.layers.51.mlp.experts.146.down_proj", "model.layers.51.mlp.experts.147.down_proj", "model.layers.51.mlp.experts.148.down_proj", "model.layers.51.mlp.experts.149.down_proj", "model.layers.51.mlp.experts.150.down_proj", "model.layers.51.mlp.experts.151.down_proj", "model.layers.51.mlp.experts.152.down_proj", "model.layers.51.mlp.experts.153.down_proj", "model.layers.51.mlp.experts.154.down_proj", "model.layers.51.mlp.experts.155.down_proj", "model.layers.51.mlp.experts.156.down_proj", "model.layers.51.mlp.experts.157.down_proj", "model.layers.51.mlp.experts.158.down_proj", "model.layers.51.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 7.6160766184340395e-06, "dbits": 1258291200 }, { "dkld": -2.2277282550929936e-05, "dbits": 2516582400 } ] }, { "idx": 309, "layers": [ "model.layers.52.self_attn.q_proj" ], "candidates": [ { "dkld": 3.641520161181723e-05, "dbits": 62914560 }, { "dkld": -2.6741530746218073e-06, "dbits": 125829120 } ] }, { "idx": 310, "layers": [ "model.layers.52.self_attn.k_proj", "model.layers.52.self_attn.v_proj" ], "candidates": [ { "dkld": 0.00010253228247165784, "dbits": 10485760 }, { "dkld": 2.580559812486241e-05, "dbits": 20971520 } ] }, { "idx": 311, "layers": [ "model.layers.52.self_attn.o_proj" ], "candidates": [ { "dkld": -1.9780010916292667e-05, "dbits": 62914560 }, { "dkld": -3.810068592429057e-05, "dbits": 125829120 } ] }, { "idx": 312, "layers": [ "model.layers.52.mlp.shared_experts.gate_proj", "model.layers.52.mlp.shared_experts.up_proj", "model.layers.52.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.0089017450809479e-05, "dbits": 23592960 }, { "dkld": 4.5031774789094925e-06, "dbits": 47185920 } ] }, { "idx": 313, "layers": [ "model.layers.52.mlp.experts.0.gate_proj", "model.layers.52.mlp.experts.1.gate_proj", "model.layers.52.mlp.experts.2.gate_proj", "model.layers.52.mlp.experts.3.gate_proj", "model.layers.52.mlp.experts.4.gate_proj", "model.layers.52.mlp.experts.5.gate_proj", "model.layers.52.mlp.experts.6.gate_proj", "model.layers.52.mlp.experts.7.gate_proj", "model.layers.52.mlp.experts.8.gate_proj", "model.layers.52.mlp.experts.9.gate_proj", "model.layers.52.mlp.experts.10.gate_proj", "model.layers.52.mlp.experts.11.gate_proj", "model.layers.52.mlp.experts.12.gate_proj", "model.layers.52.mlp.experts.13.gate_proj", "model.layers.52.mlp.experts.14.gate_proj", "model.layers.52.mlp.experts.15.gate_proj", "model.layers.52.mlp.experts.16.gate_proj", "model.layers.52.mlp.experts.17.gate_proj", "model.layers.52.mlp.experts.18.gate_proj", "model.layers.52.mlp.experts.19.gate_proj", "model.layers.52.mlp.experts.20.gate_proj", "model.layers.52.mlp.experts.21.gate_proj", "model.layers.52.mlp.experts.22.gate_proj", "model.layers.52.mlp.experts.23.gate_proj", "model.layers.52.mlp.experts.24.gate_proj", "model.layers.52.mlp.experts.25.gate_proj", "model.layers.52.mlp.experts.26.gate_proj", "model.layers.52.mlp.experts.27.gate_proj", "model.layers.52.mlp.experts.28.gate_proj", "model.layers.52.mlp.experts.29.gate_proj", "model.layers.52.mlp.experts.30.gate_proj", "model.layers.52.mlp.experts.31.gate_proj", "model.layers.52.mlp.experts.32.gate_proj", "model.layers.52.mlp.experts.33.gate_proj", "model.layers.52.mlp.experts.34.gate_proj", "model.layers.52.mlp.experts.35.gate_proj", "model.layers.52.mlp.experts.36.gate_proj", "model.layers.52.mlp.experts.37.gate_proj", "model.layers.52.mlp.experts.38.gate_proj", "model.layers.52.mlp.experts.39.gate_proj", "model.layers.52.mlp.experts.40.gate_proj", "model.layers.52.mlp.experts.41.gate_proj", "model.layers.52.mlp.experts.42.gate_proj", "model.layers.52.mlp.experts.43.gate_proj", "model.layers.52.mlp.experts.44.gate_proj", "model.layers.52.mlp.experts.45.gate_proj", "model.layers.52.mlp.experts.46.gate_proj", "model.layers.52.mlp.experts.47.gate_proj", "model.layers.52.mlp.experts.48.gate_proj", "model.layers.52.mlp.experts.49.gate_proj", "model.layers.52.mlp.experts.50.gate_proj", "model.layers.52.mlp.experts.51.gate_proj", "model.layers.52.mlp.experts.52.gate_proj", "model.layers.52.mlp.experts.53.gate_proj", "model.layers.52.mlp.experts.54.gate_proj", "model.layers.52.mlp.experts.55.gate_proj", "model.layers.52.mlp.experts.56.gate_proj", "model.layers.52.mlp.experts.57.gate_proj", "model.layers.52.mlp.experts.58.gate_proj", "model.layers.52.mlp.experts.59.gate_proj", "model.layers.52.mlp.experts.60.gate_proj", "model.layers.52.mlp.experts.61.gate_proj", "model.layers.52.mlp.experts.62.gate_proj", "model.layers.52.mlp.experts.63.gate_proj", "model.layers.52.mlp.experts.64.gate_proj", "model.layers.52.mlp.experts.65.gate_proj", "model.layers.52.mlp.experts.66.gate_proj", "model.layers.52.mlp.experts.67.gate_proj", "model.layers.52.mlp.experts.68.gate_proj", "model.layers.52.mlp.experts.69.gate_proj", "model.layers.52.mlp.experts.70.gate_proj", "model.layers.52.mlp.experts.71.gate_proj", "model.layers.52.mlp.experts.72.gate_proj", "model.layers.52.mlp.experts.73.gate_proj", "model.layers.52.mlp.experts.74.gate_proj", "model.layers.52.mlp.experts.75.gate_proj", "model.layers.52.mlp.experts.76.gate_proj", "model.layers.52.mlp.experts.77.gate_proj", "model.layers.52.mlp.experts.78.gate_proj", "model.layers.52.mlp.experts.79.gate_proj", "model.layers.52.mlp.experts.80.gate_proj", "model.layers.52.mlp.experts.81.gate_proj", "model.layers.52.mlp.experts.82.gate_proj", "model.layers.52.mlp.experts.83.gate_proj", "model.layers.52.mlp.experts.84.gate_proj", "model.layers.52.mlp.experts.85.gate_proj", "model.layers.52.mlp.experts.86.gate_proj", "model.layers.52.mlp.experts.87.gate_proj", "model.layers.52.mlp.experts.88.gate_proj", "model.layers.52.mlp.experts.89.gate_proj", "model.layers.52.mlp.experts.90.gate_proj", "model.layers.52.mlp.experts.91.gate_proj", "model.layers.52.mlp.experts.92.gate_proj", "model.layers.52.mlp.experts.93.gate_proj", "model.layers.52.mlp.experts.94.gate_proj", "model.layers.52.mlp.experts.95.gate_proj", "model.layers.52.mlp.experts.96.gate_proj", "model.layers.52.mlp.experts.97.gate_proj", "model.layers.52.mlp.experts.98.gate_proj", "model.layers.52.mlp.experts.99.gate_proj", "model.layers.52.mlp.experts.100.gate_proj", "model.layers.52.mlp.experts.101.gate_proj", "model.layers.52.mlp.experts.102.gate_proj", "model.layers.52.mlp.experts.103.gate_proj", "model.layers.52.mlp.experts.104.gate_proj", "model.layers.52.mlp.experts.105.gate_proj", "model.layers.52.mlp.experts.106.gate_proj", "model.layers.52.mlp.experts.107.gate_proj", "model.layers.52.mlp.experts.108.gate_proj", "model.layers.52.mlp.experts.109.gate_proj", "model.layers.52.mlp.experts.110.gate_proj", "model.layers.52.mlp.experts.111.gate_proj", "model.layers.52.mlp.experts.112.gate_proj", "model.layers.52.mlp.experts.113.gate_proj", "model.layers.52.mlp.experts.114.gate_proj", "model.layers.52.mlp.experts.115.gate_proj", "model.layers.52.mlp.experts.116.gate_proj", "model.layers.52.mlp.experts.117.gate_proj", "model.layers.52.mlp.experts.118.gate_proj", "model.layers.52.mlp.experts.119.gate_proj", "model.layers.52.mlp.experts.120.gate_proj", "model.layers.52.mlp.experts.121.gate_proj", "model.layers.52.mlp.experts.122.gate_proj", "model.layers.52.mlp.experts.123.gate_proj", "model.layers.52.mlp.experts.124.gate_proj", "model.layers.52.mlp.experts.125.gate_proj", "model.layers.52.mlp.experts.126.gate_proj", "model.layers.52.mlp.experts.127.gate_proj", "model.layers.52.mlp.experts.128.gate_proj", "model.layers.52.mlp.experts.129.gate_proj", "model.layers.52.mlp.experts.130.gate_proj", "model.layers.52.mlp.experts.131.gate_proj", "model.layers.52.mlp.experts.132.gate_proj", "model.layers.52.mlp.experts.133.gate_proj", "model.layers.52.mlp.experts.134.gate_proj", "model.layers.52.mlp.experts.135.gate_proj", "model.layers.52.mlp.experts.136.gate_proj", "model.layers.52.mlp.experts.137.gate_proj", "model.layers.52.mlp.experts.138.gate_proj", "model.layers.52.mlp.experts.139.gate_proj", "model.layers.52.mlp.experts.140.gate_proj", "model.layers.52.mlp.experts.141.gate_proj", "model.layers.52.mlp.experts.142.gate_proj", "model.layers.52.mlp.experts.143.gate_proj", "model.layers.52.mlp.experts.144.gate_proj", "model.layers.52.mlp.experts.145.gate_proj", "model.layers.52.mlp.experts.146.gate_proj", "model.layers.52.mlp.experts.147.gate_proj", "model.layers.52.mlp.experts.148.gate_proj", "model.layers.52.mlp.experts.149.gate_proj", "model.layers.52.mlp.experts.150.gate_proj", "model.layers.52.mlp.experts.151.gate_proj", "model.layers.52.mlp.experts.152.gate_proj", "model.layers.52.mlp.experts.153.gate_proj", "model.layers.52.mlp.experts.154.gate_proj", "model.layers.52.mlp.experts.155.gate_proj", "model.layers.52.mlp.experts.156.gate_proj", "model.layers.52.mlp.experts.157.gate_proj", "model.layers.52.mlp.experts.158.gate_proj", "model.layers.52.mlp.experts.159.gate_proj", "model.layers.52.mlp.experts.0.up_proj", "model.layers.52.mlp.experts.1.up_proj", "model.layers.52.mlp.experts.2.up_proj", "model.layers.52.mlp.experts.3.up_proj", "model.layers.52.mlp.experts.4.up_proj", "model.layers.52.mlp.experts.5.up_proj", "model.layers.52.mlp.experts.6.up_proj", "model.layers.52.mlp.experts.7.up_proj", "model.layers.52.mlp.experts.8.up_proj", "model.layers.52.mlp.experts.9.up_proj", "model.layers.52.mlp.experts.10.up_proj", "model.layers.52.mlp.experts.11.up_proj", "model.layers.52.mlp.experts.12.up_proj", "model.layers.52.mlp.experts.13.up_proj", "model.layers.52.mlp.experts.14.up_proj", "model.layers.52.mlp.experts.15.up_proj", "model.layers.52.mlp.experts.16.up_proj", "model.layers.52.mlp.experts.17.up_proj", "model.layers.52.mlp.experts.18.up_proj", "model.layers.52.mlp.experts.19.up_proj", "model.layers.52.mlp.experts.20.up_proj", "model.layers.52.mlp.experts.21.up_proj", "model.layers.52.mlp.experts.22.up_proj", "model.layers.52.mlp.experts.23.up_proj", "model.layers.52.mlp.experts.24.up_proj", "model.layers.52.mlp.experts.25.up_proj", "model.layers.52.mlp.experts.26.up_proj", "model.layers.52.mlp.experts.27.up_proj", "model.layers.52.mlp.experts.28.up_proj", "model.layers.52.mlp.experts.29.up_proj", "model.layers.52.mlp.experts.30.up_proj", "model.layers.52.mlp.experts.31.up_proj", "model.layers.52.mlp.experts.32.up_proj", "model.layers.52.mlp.experts.33.up_proj", "model.layers.52.mlp.experts.34.up_proj", "model.layers.52.mlp.experts.35.up_proj", "model.layers.52.mlp.experts.36.up_proj", "model.layers.52.mlp.experts.37.up_proj", "model.layers.52.mlp.experts.38.up_proj", "model.layers.52.mlp.experts.39.up_proj", "model.layers.52.mlp.experts.40.up_proj", "model.layers.52.mlp.experts.41.up_proj", "model.layers.52.mlp.experts.42.up_proj", "model.layers.52.mlp.experts.43.up_proj", "model.layers.52.mlp.experts.44.up_proj", "model.layers.52.mlp.experts.45.up_proj", "model.layers.52.mlp.experts.46.up_proj", "model.layers.52.mlp.experts.47.up_proj", "model.layers.52.mlp.experts.48.up_proj", "model.layers.52.mlp.experts.49.up_proj", "model.layers.52.mlp.experts.50.up_proj", "model.layers.52.mlp.experts.51.up_proj", "model.layers.52.mlp.experts.52.up_proj", "model.layers.52.mlp.experts.53.up_proj", "model.layers.52.mlp.experts.54.up_proj", "model.layers.52.mlp.experts.55.up_proj", "model.layers.52.mlp.experts.56.up_proj", "model.layers.52.mlp.experts.57.up_proj", "model.layers.52.mlp.experts.58.up_proj", "model.layers.52.mlp.experts.59.up_proj", "model.layers.52.mlp.experts.60.up_proj", "model.layers.52.mlp.experts.61.up_proj", "model.layers.52.mlp.experts.62.up_proj", "model.layers.52.mlp.experts.63.up_proj", "model.layers.52.mlp.experts.64.up_proj", "model.layers.52.mlp.experts.65.up_proj", "model.layers.52.mlp.experts.66.up_proj", "model.layers.52.mlp.experts.67.up_proj", "model.layers.52.mlp.experts.68.up_proj", "model.layers.52.mlp.experts.69.up_proj", "model.layers.52.mlp.experts.70.up_proj", "model.layers.52.mlp.experts.71.up_proj", "model.layers.52.mlp.experts.72.up_proj", "model.layers.52.mlp.experts.73.up_proj", "model.layers.52.mlp.experts.74.up_proj", "model.layers.52.mlp.experts.75.up_proj", "model.layers.52.mlp.experts.76.up_proj", "model.layers.52.mlp.experts.77.up_proj", "model.layers.52.mlp.experts.78.up_proj", "model.layers.52.mlp.experts.79.up_proj", "model.layers.52.mlp.experts.80.up_proj", "model.layers.52.mlp.experts.81.up_proj", "model.layers.52.mlp.experts.82.up_proj", "model.layers.52.mlp.experts.83.up_proj", "model.layers.52.mlp.experts.84.up_proj", "model.layers.52.mlp.experts.85.up_proj", "model.layers.52.mlp.experts.86.up_proj", "model.layers.52.mlp.experts.87.up_proj", "model.layers.52.mlp.experts.88.up_proj", "model.layers.52.mlp.experts.89.up_proj", "model.layers.52.mlp.experts.90.up_proj", "model.layers.52.mlp.experts.91.up_proj", "model.layers.52.mlp.experts.92.up_proj", "model.layers.52.mlp.experts.93.up_proj", "model.layers.52.mlp.experts.94.up_proj", "model.layers.52.mlp.experts.95.up_proj", "model.layers.52.mlp.experts.96.up_proj", "model.layers.52.mlp.experts.97.up_proj", "model.layers.52.mlp.experts.98.up_proj", "model.layers.52.mlp.experts.99.up_proj", "model.layers.52.mlp.experts.100.up_proj", "model.layers.52.mlp.experts.101.up_proj", "model.layers.52.mlp.experts.102.up_proj", "model.layers.52.mlp.experts.103.up_proj", "model.layers.52.mlp.experts.104.up_proj", "model.layers.52.mlp.experts.105.up_proj", "model.layers.52.mlp.experts.106.up_proj", "model.layers.52.mlp.experts.107.up_proj", "model.layers.52.mlp.experts.108.up_proj", "model.layers.52.mlp.experts.109.up_proj", "model.layers.52.mlp.experts.110.up_proj", "model.layers.52.mlp.experts.111.up_proj", "model.layers.52.mlp.experts.112.up_proj", "model.layers.52.mlp.experts.113.up_proj", "model.layers.52.mlp.experts.114.up_proj", "model.layers.52.mlp.experts.115.up_proj", "model.layers.52.mlp.experts.116.up_proj", "model.layers.52.mlp.experts.117.up_proj", "model.layers.52.mlp.experts.118.up_proj", "model.layers.52.mlp.experts.119.up_proj", "model.layers.52.mlp.experts.120.up_proj", "model.layers.52.mlp.experts.121.up_proj", "model.layers.52.mlp.experts.122.up_proj", "model.layers.52.mlp.experts.123.up_proj", "model.layers.52.mlp.experts.124.up_proj", "model.layers.52.mlp.experts.125.up_proj", "model.layers.52.mlp.experts.126.up_proj", "model.layers.52.mlp.experts.127.up_proj", "model.layers.52.mlp.experts.128.up_proj", "model.layers.52.mlp.experts.129.up_proj", "model.layers.52.mlp.experts.130.up_proj", "model.layers.52.mlp.experts.131.up_proj", "model.layers.52.mlp.experts.132.up_proj", "model.layers.52.mlp.experts.133.up_proj", "model.layers.52.mlp.experts.134.up_proj", "model.layers.52.mlp.experts.135.up_proj", "model.layers.52.mlp.experts.136.up_proj", "model.layers.52.mlp.experts.137.up_proj", "model.layers.52.mlp.experts.138.up_proj", "model.layers.52.mlp.experts.139.up_proj", "model.layers.52.mlp.experts.140.up_proj", "model.layers.52.mlp.experts.141.up_proj", "model.layers.52.mlp.experts.142.up_proj", "model.layers.52.mlp.experts.143.up_proj", "model.layers.52.mlp.experts.144.up_proj", "model.layers.52.mlp.experts.145.up_proj", "model.layers.52.mlp.experts.146.up_proj", "model.layers.52.mlp.experts.147.up_proj", "model.layers.52.mlp.experts.148.up_proj", "model.layers.52.mlp.experts.149.up_proj", "model.layers.52.mlp.experts.150.up_proj", "model.layers.52.mlp.experts.151.up_proj", "model.layers.52.mlp.experts.152.up_proj", "model.layers.52.mlp.experts.153.up_proj", "model.layers.52.mlp.experts.154.up_proj", "model.layers.52.mlp.experts.155.up_proj", "model.layers.52.mlp.experts.156.up_proj", "model.layers.52.mlp.experts.157.up_proj", "model.layers.52.mlp.experts.158.up_proj", "model.layers.52.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -2.4388940073548707e-05, "dbits": 2516582400 }, { "dkld": -1.1065974831574177e-06, "dbits": 5033164800 } ] }, { "idx": 314, "layers": [ "model.layers.52.mlp.experts.0.down_proj", "model.layers.52.mlp.experts.1.down_proj", "model.layers.52.mlp.experts.2.down_proj", "model.layers.52.mlp.experts.3.down_proj", "model.layers.52.mlp.experts.4.down_proj", "model.layers.52.mlp.experts.5.down_proj", "model.layers.52.mlp.experts.6.down_proj", "model.layers.52.mlp.experts.7.down_proj", "model.layers.52.mlp.experts.8.down_proj", "model.layers.52.mlp.experts.9.down_proj", "model.layers.52.mlp.experts.10.down_proj", "model.layers.52.mlp.experts.11.down_proj", "model.layers.52.mlp.experts.12.down_proj", "model.layers.52.mlp.experts.13.down_proj", "model.layers.52.mlp.experts.14.down_proj", "model.layers.52.mlp.experts.15.down_proj", "model.layers.52.mlp.experts.16.down_proj", "model.layers.52.mlp.experts.17.down_proj", "model.layers.52.mlp.experts.18.down_proj", "model.layers.52.mlp.experts.19.down_proj", "model.layers.52.mlp.experts.20.down_proj", "model.layers.52.mlp.experts.21.down_proj", "model.layers.52.mlp.experts.22.down_proj", "model.layers.52.mlp.experts.23.down_proj", "model.layers.52.mlp.experts.24.down_proj", "model.layers.52.mlp.experts.25.down_proj", "model.layers.52.mlp.experts.26.down_proj", "model.layers.52.mlp.experts.27.down_proj", "model.layers.52.mlp.experts.28.down_proj", "model.layers.52.mlp.experts.29.down_proj", "model.layers.52.mlp.experts.30.down_proj", "model.layers.52.mlp.experts.31.down_proj", "model.layers.52.mlp.experts.32.down_proj", "model.layers.52.mlp.experts.33.down_proj", "model.layers.52.mlp.experts.34.down_proj", "model.layers.52.mlp.experts.35.down_proj", "model.layers.52.mlp.experts.36.down_proj", "model.layers.52.mlp.experts.37.down_proj", "model.layers.52.mlp.experts.38.down_proj", "model.layers.52.mlp.experts.39.down_proj", "model.layers.52.mlp.experts.40.down_proj", "model.layers.52.mlp.experts.41.down_proj", "model.layers.52.mlp.experts.42.down_proj", "model.layers.52.mlp.experts.43.down_proj", "model.layers.52.mlp.experts.44.down_proj", "model.layers.52.mlp.experts.45.down_proj", "model.layers.52.mlp.experts.46.down_proj", "model.layers.52.mlp.experts.47.down_proj", "model.layers.52.mlp.experts.48.down_proj", "model.layers.52.mlp.experts.49.down_proj", "model.layers.52.mlp.experts.50.down_proj", "model.layers.52.mlp.experts.51.down_proj", "model.layers.52.mlp.experts.52.down_proj", "model.layers.52.mlp.experts.53.down_proj", "model.layers.52.mlp.experts.54.down_proj", "model.layers.52.mlp.experts.55.down_proj", "model.layers.52.mlp.experts.56.down_proj", "model.layers.52.mlp.experts.57.down_proj", "model.layers.52.mlp.experts.58.down_proj", "model.layers.52.mlp.experts.59.down_proj", "model.layers.52.mlp.experts.60.down_proj", "model.layers.52.mlp.experts.61.down_proj", "model.layers.52.mlp.experts.62.down_proj", "model.layers.52.mlp.experts.63.down_proj", "model.layers.52.mlp.experts.64.down_proj", "model.layers.52.mlp.experts.65.down_proj", "model.layers.52.mlp.experts.66.down_proj", "model.layers.52.mlp.experts.67.down_proj", "model.layers.52.mlp.experts.68.down_proj", "model.layers.52.mlp.experts.69.down_proj", "model.layers.52.mlp.experts.70.down_proj", "model.layers.52.mlp.experts.71.down_proj", "model.layers.52.mlp.experts.72.down_proj", "model.layers.52.mlp.experts.73.down_proj", "model.layers.52.mlp.experts.74.down_proj", "model.layers.52.mlp.experts.75.down_proj", "model.layers.52.mlp.experts.76.down_proj", "model.layers.52.mlp.experts.77.down_proj", "model.layers.52.mlp.experts.78.down_proj", "model.layers.52.mlp.experts.79.down_proj", "model.layers.52.mlp.experts.80.down_proj", "model.layers.52.mlp.experts.81.down_proj", "model.layers.52.mlp.experts.82.down_proj", "model.layers.52.mlp.experts.83.down_proj", "model.layers.52.mlp.experts.84.down_proj", "model.layers.52.mlp.experts.85.down_proj", "model.layers.52.mlp.experts.86.down_proj", "model.layers.52.mlp.experts.87.down_proj", "model.layers.52.mlp.experts.88.down_proj", "model.layers.52.mlp.experts.89.down_proj", "model.layers.52.mlp.experts.90.down_proj", "model.layers.52.mlp.experts.91.down_proj", "model.layers.52.mlp.experts.92.down_proj", "model.layers.52.mlp.experts.93.down_proj", "model.layers.52.mlp.experts.94.down_proj", "model.layers.52.mlp.experts.95.down_proj", "model.layers.52.mlp.experts.96.down_proj", "model.layers.52.mlp.experts.97.down_proj", "model.layers.52.mlp.experts.98.down_proj", "model.layers.52.mlp.experts.99.down_proj", "model.layers.52.mlp.experts.100.down_proj", "model.layers.52.mlp.experts.101.down_proj", "model.layers.52.mlp.experts.102.down_proj", "model.layers.52.mlp.experts.103.down_proj", "model.layers.52.mlp.experts.104.down_proj", "model.layers.52.mlp.experts.105.down_proj", "model.layers.52.mlp.experts.106.down_proj", "model.layers.52.mlp.experts.107.down_proj", "model.layers.52.mlp.experts.108.down_proj", "model.layers.52.mlp.experts.109.down_proj", "model.layers.52.mlp.experts.110.down_proj", "model.layers.52.mlp.experts.111.down_proj", "model.layers.52.mlp.experts.112.down_proj", "model.layers.52.mlp.experts.113.down_proj", "model.layers.52.mlp.experts.114.down_proj", "model.layers.52.mlp.experts.115.down_proj", "model.layers.52.mlp.experts.116.down_proj", "model.layers.52.mlp.experts.117.down_proj", "model.layers.52.mlp.experts.118.down_proj", "model.layers.52.mlp.experts.119.down_proj", "model.layers.52.mlp.experts.120.down_proj", "model.layers.52.mlp.experts.121.down_proj", "model.layers.52.mlp.experts.122.down_proj", "model.layers.52.mlp.experts.123.down_proj", "model.layers.52.mlp.experts.124.down_proj", "model.layers.52.mlp.experts.125.down_proj", "model.layers.52.mlp.experts.126.down_proj", "model.layers.52.mlp.experts.127.down_proj", "model.layers.52.mlp.experts.128.down_proj", "model.layers.52.mlp.experts.129.down_proj", "model.layers.52.mlp.experts.130.down_proj", "model.layers.52.mlp.experts.131.down_proj", "model.layers.52.mlp.experts.132.down_proj", "model.layers.52.mlp.experts.133.down_proj", "model.layers.52.mlp.experts.134.down_proj", "model.layers.52.mlp.experts.135.down_proj", "model.layers.52.mlp.experts.136.down_proj", "model.layers.52.mlp.experts.137.down_proj", "model.layers.52.mlp.experts.138.down_proj", "model.layers.52.mlp.experts.139.down_proj", "model.layers.52.mlp.experts.140.down_proj", "model.layers.52.mlp.experts.141.down_proj", "model.layers.52.mlp.experts.142.down_proj", "model.layers.52.mlp.experts.143.down_proj", "model.layers.52.mlp.experts.144.down_proj", "model.layers.52.mlp.experts.145.down_proj", "model.layers.52.mlp.experts.146.down_proj", "model.layers.52.mlp.experts.147.down_proj", "model.layers.52.mlp.experts.148.down_proj", "model.layers.52.mlp.experts.149.down_proj", "model.layers.52.mlp.experts.150.down_proj", "model.layers.52.mlp.experts.151.down_proj", "model.layers.52.mlp.experts.152.down_proj", "model.layers.52.mlp.experts.153.down_proj", "model.layers.52.mlp.experts.154.down_proj", "model.layers.52.mlp.experts.155.down_proj", "model.layers.52.mlp.experts.156.down_proj", "model.layers.52.mlp.experts.157.down_proj", "model.layers.52.mlp.experts.158.down_proj", "model.layers.52.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.2618163600562615e-05, "dbits": 1258291200 }, { "dkld": 1.9686296582228924e-06, "dbits": 2516582400 } ] }, { "idx": 315, "layers": [ "model.layers.53.self_attn.q_proj" ], "candidates": [ { "dkld": -2.967710606753722e-05, "dbits": 62914560 }, { "dkld": -9.749084711074829e-06, "dbits": 125829120 } ] }, { "idx": 316, "layers": [ "model.layers.53.self_attn.k_proj", "model.layers.53.self_attn.v_proj" ], "candidates": [ { "dkld": 2.4629058316349983e-05, "dbits": 10485760 }, { "dkld": 4.0858518332246435e-06, "dbits": 20971520 } ] }, { "idx": 317, "layers": [ "model.layers.53.self_attn.o_proj" ], "candidates": [ { "dkld": -4.671078640967538e-05, "dbits": 62914560 }, { "dkld": -4.6710483729839325e-05, "dbits": 125829120 } ] }, { "idx": 318, "layers": [ "model.layers.53.mlp.shared_experts.gate_proj", "model.layers.53.mlp.shared_experts.up_proj", "model.layers.53.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.5312409959734527e-05, "dbits": 23592960 }, { "dkld": 2.256964799016853e-05, "dbits": 47185920 } ] }, { "idx": 319, "layers": [ "model.layers.53.mlp.experts.0.gate_proj", "model.layers.53.mlp.experts.1.gate_proj", "model.layers.53.mlp.experts.2.gate_proj", "model.layers.53.mlp.experts.3.gate_proj", "model.layers.53.mlp.experts.4.gate_proj", "model.layers.53.mlp.experts.5.gate_proj", "model.layers.53.mlp.experts.6.gate_proj", "model.layers.53.mlp.experts.7.gate_proj", "model.layers.53.mlp.experts.8.gate_proj", "model.layers.53.mlp.experts.9.gate_proj", "model.layers.53.mlp.experts.10.gate_proj", "model.layers.53.mlp.experts.11.gate_proj", "model.layers.53.mlp.experts.12.gate_proj", "model.layers.53.mlp.experts.13.gate_proj", "model.layers.53.mlp.experts.14.gate_proj", "model.layers.53.mlp.experts.15.gate_proj", "model.layers.53.mlp.experts.16.gate_proj", "model.layers.53.mlp.experts.17.gate_proj", "model.layers.53.mlp.experts.18.gate_proj", "model.layers.53.mlp.experts.19.gate_proj", "model.layers.53.mlp.experts.20.gate_proj", "model.layers.53.mlp.experts.21.gate_proj", "model.layers.53.mlp.experts.22.gate_proj", "model.layers.53.mlp.experts.23.gate_proj", "model.layers.53.mlp.experts.24.gate_proj", "model.layers.53.mlp.experts.25.gate_proj", "model.layers.53.mlp.experts.26.gate_proj", "model.layers.53.mlp.experts.27.gate_proj", "model.layers.53.mlp.experts.28.gate_proj", "model.layers.53.mlp.experts.29.gate_proj", "model.layers.53.mlp.experts.30.gate_proj", "model.layers.53.mlp.experts.31.gate_proj", "model.layers.53.mlp.experts.32.gate_proj", "model.layers.53.mlp.experts.33.gate_proj", "model.layers.53.mlp.experts.34.gate_proj", "model.layers.53.mlp.experts.35.gate_proj", "model.layers.53.mlp.experts.36.gate_proj", "model.layers.53.mlp.experts.37.gate_proj", "model.layers.53.mlp.experts.38.gate_proj", "model.layers.53.mlp.experts.39.gate_proj", "model.layers.53.mlp.experts.40.gate_proj", "model.layers.53.mlp.experts.41.gate_proj", "model.layers.53.mlp.experts.42.gate_proj", "model.layers.53.mlp.experts.43.gate_proj", "model.layers.53.mlp.experts.44.gate_proj", "model.layers.53.mlp.experts.45.gate_proj", "model.layers.53.mlp.experts.46.gate_proj", "model.layers.53.mlp.experts.47.gate_proj", "model.layers.53.mlp.experts.48.gate_proj", "model.layers.53.mlp.experts.49.gate_proj", "model.layers.53.mlp.experts.50.gate_proj", "model.layers.53.mlp.experts.51.gate_proj", "model.layers.53.mlp.experts.52.gate_proj", "model.layers.53.mlp.experts.53.gate_proj", "model.layers.53.mlp.experts.54.gate_proj", "model.layers.53.mlp.experts.55.gate_proj", "model.layers.53.mlp.experts.56.gate_proj", "model.layers.53.mlp.experts.57.gate_proj", "model.layers.53.mlp.experts.58.gate_proj", "model.layers.53.mlp.experts.59.gate_proj", "model.layers.53.mlp.experts.60.gate_proj", "model.layers.53.mlp.experts.61.gate_proj", "model.layers.53.mlp.experts.62.gate_proj", "model.layers.53.mlp.experts.63.gate_proj", "model.layers.53.mlp.experts.64.gate_proj", "model.layers.53.mlp.experts.65.gate_proj", "model.layers.53.mlp.experts.66.gate_proj", "model.layers.53.mlp.experts.67.gate_proj", "model.layers.53.mlp.experts.68.gate_proj", "model.layers.53.mlp.experts.69.gate_proj", "model.layers.53.mlp.experts.70.gate_proj", "model.layers.53.mlp.experts.71.gate_proj", "model.layers.53.mlp.experts.72.gate_proj", "model.layers.53.mlp.experts.73.gate_proj", "model.layers.53.mlp.experts.74.gate_proj", "model.layers.53.mlp.experts.75.gate_proj", "model.layers.53.mlp.experts.76.gate_proj", "model.layers.53.mlp.experts.77.gate_proj", "model.layers.53.mlp.experts.78.gate_proj", "model.layers.53.mlp.experts.79.gate_proj", "model.layers.53.mlp.experts.80.gate_proj", "model.layers.53.mlp.experts.81.gate_proj", "model.layers.53.mlp.experts.82.gate_proj", "model.layers.53.mlp.experts.83.gate_proj", "model.layers.53.mlp.experts.84.gate_proj", "model.layers.53.mlp.experts.85.gate_proj", "model.layers.53.mlp.experts.86.gate_proj", "model.layers.53.mlp.experts.87.gate_proj", "model.layers.53.mlp.experts.88.gate_proj", "model.layers.53.mlp.experts.89.gate_proj", "model.layers.53.mlp.experts.90.gate_proj", "model.layers.53.mlp.experts.91.gate_proj", "model.layers.53.mlp.experts.92.gate_proj", "model.layers.53.mlp.experts.93.gate_proj", "model.layers.53.mlp.experts.94.gate_proj", "model.layers.53.mlp.experts.95.gate_proj", "model.layers.53.mlp.experts.96.gate_proj", "model.layers.53.mlp.experts.97.gate_proj", "model.layers.53.mlp.experts.98.gate_proj", "model.layers.53.mlp.experts.99.gate_proj", "model.layers.53.mlp.experts.100.gate_proj", "model.layers.53.mlp.experts.101.gate_proj", "model.layers.53.mlp.experts.102.gate_proj", "model.layers.53.mlp.experts.103.gate_proj", "model.layers.53.mlp.experts.104.gate_proj", "model.layers.53.mlp.experts.105.gate_proj", "model.layers.53.mlp.experts.106.gate_proj", "model.layers.53.mlp.experts.107.gate_proj", "model.layers.53.mlp.experts.108.gate_proj", "model.layers.53.mlp.experts.109.gate_proj", "model.layers.53.mlp.experts.110.gate_proj", "model.layers.53.mlp.experts.111.gate_proj", "model.layers.53.mlp.experts.112.gate_proj", "model.layers.53.mlp.experts.113.gate_proj", "model.layers.53.mlp.experts.114.gate_proj", "model.layers.53.mlp.experts.115.gate_proj", "model.layers.53.mlp.experts.116.gate_proj", "model.layers.53.mlp.experts.117.gate_proj", "model.layers.53.mlp.experts.118.gate_proj", "model.layers.53.mlp.experts.119.gate_proj", "model.layers.53.mlp.experts.120.gate_proj", "model.layers.53.mlp.experts.121.gate_proj", "model.layers.53.mlp.experts.122.gate_proj", "model.layers.53.mlp.experts.123.gate_proj", "model.layers.53.mlp.experts.124.gate_proj", "model.layers.53.mlp.experts.125.gate_proj", "model.layers.53.mlp.experts.126.gate_proj", "model.layers.53.mlp.experts.127.gate_proj", "model.layers.53.mlp.experts.128.gate_proj", "model.layers.53.mlp.experts.129.gate_proj", "model.layers.53.mlp.experts.130.gate_proj", "model.layers.53.mlp.experts.131.gate_proj", "model.layers.53.mlp.experts.132.gate_proj", "model.layers.53.mlp.experts.133.gate_proj", "model.layers.53.mlp.experts.134.gate_proj", "model.layers.53.mlp.experts.135.gate_proj", "model.layers.53.mlp.experts.136.gate_proj", "model.layers.53.mlp.experts.137.gate_proj", "model.layers.53.mlp.experts.138.gate_proj", "model.layers.53.mlp.experts.139.gate_proj", "model.layers.53.mlp.experts.140.gate_proj", "model.layers.53.mlp.experts.141.gate_proj", "model.layers.53.mlp.experts.142.gate_proj", "model.layers.53.mlp.experts.143.gate_proj", "model.layers.53.mlp.experts.144.gate_proj", "model.layers.53.mlp.experts.145.gate_proj", "model.layers.53.mlp.experts.146.gate_proj", "model.layers.53.mlp.experts.147.gate_proj", "model.layers.53.mlp.experts.148.gate_proj", "model.layers.53.mlp.experts.149.gate_proj", "model.layers.53.mlp.experts.150.gate_proj", "model.layers.53.mlp.experts.151.gate_proj", "model.layers.53.mlp.experts.152.gate_proj", "model.layers.53.mlp.experts.153.gate_proj", "model.layers.53.mlp.experts.154.gate_proj", "model.layers.53.mlp.experts.155.gate_proj", "model.layers.53.mlp.experts.156.gate_proj", "model.layers.53.mlp.experts.157.gate_proj", "model.layers.53.mlp.experts.158.gate_proj", "model.layers.53.mlp.experts.159.gate_proj", "model.layers.53.mlp.experts.0.up_proj", "model.layers.53.mlp.experts.1.up_proj", "model.layers.53.mlp.experts.2.up_proj", "model.layers.53.mlp.experts.3.up_proj", "model.layers.53.mlp.experts.4.up_proj", "model.layers.53.mlp.experts.5.up_proj", "model.layers.53.mlp.experts.6.up_proj", "model.layers.53.mlp.experts.7.up_proj", "model.layers.53.mlp.experts.8.up_proj", "model.layers.53.mlp.experts.9.up_proj", "model.layers.53.mlp.experts.10.up_proj", "model.layers.53.mlp.experts.11.up_proj", "model.layers.53.mlp.experts.12.up_proj", "model.layers.53.mlp.experts.13.up_proj", "model.layers.53.mlp.experts.14.up_proj", "model.layers.53.mlp.experts.15.up_proj", "model.layers.53.mlp.experts.16.up_proj", "model.layers.53.mlp.experts.17.up_proj", "model.layers.53.mlp.experts.18.up_proj", "model.layers.53.mlp.experts.19.up_proj", "model.layers.53.mlp.experts.20.up_proj", "model.layers.53.mlp.experts.21.up_proj", "model.layers.53.mlp.experts.22.up_proj", "model.layers.53.mlp.experts.23.up_proj", "model.layers.53.mlp.experts.24.up_proj", "model.layers.53.mlp.experts.25.up_proj", "model.layers.53.mlp.experts.26.up_proj", "model.layers.53.mlp.experts.27.up_proj", "model.layers.53.mlp.experts.28.up_proj", "model.layers.53.mlp.experts.29.up_proj", "model.layers.53.mlp.experts.30.up_proj", "model.layers.53.mlp.experts.31.up_proj", "model.layers.53.mlp.experts.32.up_proj", "model.layers.53.mlp.experts.33.up_proj", "model.layers.53.mlp.experts.34.up_proj", "model.layers.53.mlp.experts.35.up_proj", "model.layers.53.mlp.experts.36.up_proj", "model.layers.53.mlp.experts.37.up_proj", "model.layers.53.mlp.experts.38.up_proj", "model.layers.53.mlp.experts.39.up_proj", "model.layers.53.mlp.experts.40.up_proj", "model.layers.53.mlp.experts.41.up_proj", "model.layers.53.mlp.experts.42.up_proj", "model.layers.53.mlp.experts.43.up_proj", "model.layers.53.mlp.experts.44.up_proj", "model.layers.53.mlp.experts.45.up_proj", "model.layers.53.mlp.experts.46.up_proj", "model.layers.53.mlp.experts.47.up_proj", "model.layers.53.mlp.experts.48.up_proj", "model.layers.53.mlp.experts.49.up_proj", "model.layers.53.mlp.experts.50.up_proj", "model.layers.53.mlp.experts.51.up_proj", "model.layers.53.mlp.experts.52.up_proj", "model.layers.53.mlp.experts.53.up_proj", "model.layers.53.mlp.experts.54.up_proj", "model.layers.53.mlp.experts.55.up_proj", "model.layers.53.mlp.experts.56.up_proj", "model.layers.53.mlp.experts.57.up_proj", "model.layers.53.mlp.experts.58.up_proj", "model.layers.53.mlp.experts.59.up_proj", "model.layers.53.mlp.experts.60.up_proj", "model.layers.53.mlp.experts.61.up_proj", "model.layers.53.mlp.experts.62.up_proj", "model.layers.53.mlp.experts.63.up_proj", "model.layers.53.mlp.experts.64.up_proj", "model.layers.53.mlp.experts.65.up_proj", "model.layers.53.mlp.experts.66.up_proj", "model.layers.53.mlp.experts.67.up_proj", "model.layers.53.mlp.experts.68.up_proj", "model.layers.53.mlp.experts.69.up_proj", "model.layers.53.mlp.experts.70.up_proj", "model.layers.53.mlp.experts.71.up_proj", "model.layers.53.mlp.experts.72.up_proj", "model.layers.53.mlp.experts.73.up_proj", "model.layers.53.mlp.experts.74.up_proj", "model.layers.53.mlp.experts.75.up_proj", "model.layers.53.mlp.experts.76.up_proj", "model.layers.53.mlp.experts.77.up_proj", "model.layers.53.mlp.experts.78.up_proj", "model.layers.53.mlp.experts.79.up_proj", "model.layers.53.mlp.experts.80.up_proj", "model.layers.53.mlp.experts.81.up_proj", "model.layers.53.mlp.experts.82.up_proj", "model.layers.53.mlp.experts.83.up_proj", "model.layers.53.mlp.experts.84.up_proj", "model.layers.53.mlp.experts.85.up_proj", "model.layers.53.mlp.experts.86.up_proj", "model.layers.53.mlp.experts.87.up_proj", "model.layers.53.mlp.experts.88.up_proj", "model.layers.53.mlp.experts.89.up_proj", "model.layers.53.mlp.experts.90.up_proj", "model.layers.53.mlp.experts.91.up_proj", "model.layers.53.mlp.experts.92.up_proj", "model.layers.53.mlp.experts.93.up_proj", "model.layers.53.mlp.experts.94.up_proj", "model.layers.53.mlp.experts.95.up_proj", "model.layers.53.mlp.experts.96.up_proj", "model.layers.53.mlp.experts.97.up_proj", "model.layers.53.mlp.experts.98.up_proj", "model.layers.53.mlp.experts.99.up_proj", "model.layers.53.mlp.experts.100.up_proj", "model.layers.53.mlp.experts.101.up_proj", "model.layers.53.mlp.experts.102.up_proj", "model.layers.53.mlp.experts.103.up_proj", "model.layers.53.mlp.experts.104.up_proj", "model.layers.53.mlp.experts.105.up_proj", "model.layers.53.mlp.experts.106.up_proj", "model.layers.53.mlp.experts.107.up_proj", "model.layers.53.mlp.experts.108.up_proj", "model.layers.53.mlp.experts.109.up_proj", "model.layers.53.mlp.experts.110.up_proj", "model.layers.53.mlp.experts.111.up_proj", "model.layers.53.mlp.experts.112.up_proj", "model.layers.53.mlp.experts.113.up_proj", "model.layers.53.mlp.experts.114.up_proj", "model.layers.53.mlp.experts.115.up_proj", "model.layers.53.mlp.experts.116.up_proj", "model.layers.53.mlp.experts.117.up_proj", "model.layers.53.mlp.experts.118.up_proj", "model.layers.53.mlp.experts.119.up_proj", "model.layers.53.mlp.experts.120.up_proj", "model.layers.53.mlp.experts.121.up_proj", "model.layers.53.mlp.experts.122.up_proj", "model.layers.53.mlp.experts.123.up_proj", "model.layers.53.mlp.experts.124.up_proj", "model.layers.53.mlp.experts.125.up_proj", "model.layers.53.mlp.experts.126.up_proj", "model.layers.53.mlp.experts.127.up_proj", "model.layers.53.mlp.experts.128.up_proj", "model.layers.53.mlp.experts.129.up_proj", "model.layers.53.mlp.experts.130.up_proj", "model.layers.53.mlp.experts.131.up_proj", "model.layers.53.mlp.experts.132.up_proj", "model.layers.53.mlp.experts.133.up_proj", "model.layers.53.mlp.experts.134.up_proj", "model.layers.53.mlp.experts.135.up_proj", "model.layers.53.mlp.experts.136.up_proj", "model.layers.53.mlp.experts.137.up_proj", "model.layers.53.mlp.experts.138.up_proj", "model.layers.53.mlp.experts.139.up_proj", "model.layers.53.mlp.experts.140.up_proj", "model.layers.53.mlp.experts.141.up_proj", "model.layers.53.mlp.experts.142.up_proj", "model.layers.53.mlp.experts.143.up_proj", "model.layers.53.mlp.experts.144.up_proj", "model.layers.53.mlp.experts.145.up_proj", "model.layers.53.mlp.experts.146.up_proj", "model.layers.53.mlp.experts.147.up_proj", "model.layers.53.mlp.experts.148.up_proj", "model.layers.53.mlp.experts.149.up_proj", "model.layers.53.mlp.experts.150.up_proj", "model.layers.53.mlp.experts.151.up_proj", "model.layers.53.mlp.experts.152.up_proj", "model.layers.53.mlp.experts.153.up_proj", "model.layers.53.mlp.experts.154.up_proj", "model.layers.53.mlp.experts.155.up_proj", "model.layers.53.mlp.experts.156.up_proj", "model.layers.53.mlp.experts.157.up_proj", "model.layers.53.mlp.experts.158.up_proj", "model.layers.53.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 4.534935578705268e-06, "dbits": 2516582400 }, { "dkld": 1.0309065692127098e-05, "dbits": 5033164800 } ] }, { "idx": 320, "layers": [ "model.layers.53.mlp.experts.0.down_proj", "model.layers.53.mlp.experts.1.down_proj", "model.layers.53.mlp.experts.2.down_proj", "model.layers.53.mlp.experts.3.down_proj", "model.layers.53.mlp.experts.4.down_proj", "model.layers.53.mlp.experts.5.down_proj", "model.layers.53.mlp.experts.6.down_proj", "model.layers.53.mlp.experts.7.down_proj", "model.layers.53.mlp.experts.8.down_proj", "model.layers.53.mlp.experts.9.down_proj", "model.layers.53.mlp.experts.10.down_proj", "model.layers.53.mlp.experts.11.down_proj", "model.layers.53.mlp.experts.12.down_proj", "model.layers.53.mlp.experts.13.down_proj", "model.layers.53.mlp.experts.14.down_proj", "model.layers.53.mlp.experts.15.down_proj", "model.layers.53.mlp.experts.16.down_proj", "model.layers.53.mlp.experts.17.down_proj", "model.layers.53.mlp.experts.18.down_proj", "model.layers.53.mlp.experts.19.down_proj", "model.layers.53.mlp.experts.20.down_proj", "model.layers.53.mlp.experts.21.down_proj", "model.layers.53.mlp.experts.22.down_proj", "model.layers.53.mlp.experts.23.down_proj", "model.layers.53.mlp.experts.24.down_proj", "model.layers.53.mlp.experts.25.down_proj", "model.layers.53.mlp.experts.26.down_proj", "model.layers.53.mlp.experts.27.down_proj", "model.layers.53.mlp.experts.28.down_proj", "model.layers.53.mlp.experts.29.down_proj", "model.layers.53.mlp.experts.30.down_proj", "model.layers.53.mlp.experts.31.down_proj", "model.layers.53.mlp.experts.32.down_proj", "model.layers.53.mlp.experts.33.down_proj", "model.layers.53.mlp.experts.34.down_proj", "model.layers.53.mlp.experts.35.down_proj", "model.layers.53.mlp.experts.36.down_proj", "model.layers.53.mlp.experts.37.down_proj", "model.layers.53.mlp.experts.38.down_proj", "model.layers.53.mlp.experts.39.down_proj", "model.layers.53.mlp.experts.40.down_proj", "model.layers.53.mlp.experts.41.down_proj", "model.layers.53.mlp.experts.42.down_proj", "model.layers.53.mlp.experts.43.down_proj", "model.layers.53.mlp.experts.44.down_proj", "model.layers.53.mlp.experts.45.down_proj", "model.layers.53.mlp.experts.46.down_proj", "model.layers.53.mlp.experts.47.down_proj", "model.layers.53.mlp.experts.48.down_proj", "model.layers.53.mlp.experts.49.down_proj", "model.layers.53.mlp.experts.50.down_proj", "model.layers.53.mlp.experts.51.down_proj", "model.layers.53.mlp.experts.52.down_proj", "model.layers.53.mlp.experts.53.down_proj", "model.layers.53.mlp.experts.54.down_proj", "model.layers.53.mlp.experts.55.down_proj", "model.layers.53.mlp.experts.56.down_proj", "model.layers.53.mlp.experts.57.down_proj", "model.layers.53.mlp.experts.58.down_proj", "model.layers.53.mlp.experts.59.down_proj", "model.layers.53.mlp.experts.60.down_proj", "model.layers.53.mlp.experts.61.down_proj", "model.layers.53.mlp.experts.62.down_proj", "model.layers.53.mlp.experts.63.down_proj", "model.layers.53.mlp.experts.64.down_proj", "model.layers.53.mlp.experts.65.down_proj", "model.layers.53.mlp.experts.66.down_proj", "model.layers.53.mlp.experts.67.down_proj", "model.layers.53.mlp.experts.68.down_proj", "model.layers.53.mlp.experts.69.down_proj", "model.layers.53.mlp.experts.70.down_proj", "model.layers.53.mlp.experts.71.down_proj", "model.layers.53.mlp.experts.72.down_proj", "model.layers.53.mlp.experts.73.down_proj", "model.layers.53.mlp.experts.74.down_proj", "model.layers.53.mlp.experts.75.down_proj", "model.layers.53.mlp.experts.76.down_proj", "model.layers.53.mlp.experts.77.down_proj", "model.layers.53.mlp.experts.78.down_proj", "model.layers.53.mlp.experts.79.down_proj", "model.layers.53.mlp.experts.80.down_proj", "model.layers.53.mlp.experts.81.down_proj", "model.layers.53.mlp.experts.82.down_proj", "model.layers.53.mlp.experts.83.down_proj", "model.layers.53.mlp.experts.84.down_proj", "model.layers.53.mlp.experts.85.down_proj", "model.layers.53.mlp.experts.86.down_proj", "model.layers.53.mlp.experts.87.down_proj", "model.layers.53.mlp.experts.88.down_proj", "model.layers.53.mlp.experts.89.down_proj", "model.layers.53.mlp.experts.90.down_proj", "model.layers.53.mlp.experts.91.down_proj", "model.layers.53.mlp.experts.92.down_proj", "model.layers.53.mlp.experts.93.down_proj", "model.layers.53.mlp.experts.94.down_proj", "model.layers.53.mlp.experts.95.down_proj", "model.layers.53.mlp.experts.96.down_proj", "model.layers.53.mlp.experts.97.down_proj", "model.layers.53.mlp.experts.98.down_proj", "model.layers.53.mlp.experts.99.down_proj", "model.layers.53.mlp.experts.100.down_proj", "model.layers.53.mlp.experts.101.down_proj", "model.layers.53.mlp.experts.102.down_proj", "model.layers.53.mlp.experts.103.down_proj", "model.layers.53.mlp.experts.104.down_proj", "model.layers.53.mlp.experts.105.down_proj", "model.layers.53.mlp.experts.106.down_proj", "model.layers.53.mlp.experts.107.down_proj", "model.layers.53.mlp.experts.108.down_proj", "model.layers.53.mlp.experts.109.down_proj", "model.layers.53.mlp.experts.110.down_proj", "model.layers.53.mlp.experts.111.down_proj", "model.layers.53.mlp.experts.112.down_proj", "model.layers.53.mlp.experts.113.down_proj", "model.layers.53.mlp.experts.114.down_proj", "model.layers.53.mlp.experts.115.down_proj", "model.layers.53.mlp.experts.116.down_proj", "model.layers.53.mlp.experts.117.down_proj", "model.layers.53.mlp.experts.118.down_proj", "model.layers.53.mlp.experts.119.down_proj", "model.layers.53.mlp.experts.120.down_proj", "model.layers.53.mlp.experts.121.down_proj", "model.layers.53.mlp.experts.122.down_proj", "model.layers.53.mlp.experts.123.down_proj", "model.layers.53.mlp.experts.124.down_proj", "model.layers.53.mlp.experts.125.down_proj", "model.layers.53.mlp.experts.126.down_proj", "model.layers.53.mlp.experts.127.down_proj", "model.layers.53.mlp.experts.128.down_proj", "model.layers.53.mlp.experts.129.down_proj", "model.layers.53.mlp.experts.130.down_proj", "model.layers.53.mlp.experts.131.down_proj", "model.layers.53.mlp.experts.132.down_proj", "model.layers.53.mlp.experts.133.down_proj", "model.layers.53.mlp.experts.134.down_proj", "model.layers.53.mlp.experts.135.down_proj", "model.layers.53.mlp.experts.136.down_proj", "model.layers.53.mlp.experts.137.down_proj", "model.layers.53.mlp.experts.138.down_proj", "model.layers.53.mlp.experts.139.down_proj", "model.layers.53.mlp.experts.140.down_proj", "model.layers.53.mlp.experts.141.down_proj", "model.layers.53.mlp.experts.142.down_proj", "model.layers.53.mlp.experts.143.down_proj", "model.layers.53.mlp.experts.144.down_proj", "model.layers.53.mlp.experts.145.down_proj", "model.layers.53.mlp.experts.146.down_proj", "model.layers.53.mlp.experts.147.down_proj", "model.layers.53.mlp.experts.148.down_proj", "model.layers.53.mlp.experts.149.down_proj", "model.layers.53.mlp.experts.150.down_proj", "model.layers.53.mlp.experts.151.down_proj", "model.layers.53.mlp.experts.152.down_proj", "model.layers.53.mlp.experts.153.down_proj", "model.layers.53.mlp.experts.154.down_proj", "model.layers.53.mlp.experts.155.down_proj", "model.layers.53.mlp.experts.156.down_proj", "model.layers.53.mlp.experts.157.down_proj", "model.layers.53.mlp.experts.158.down_proj", "model.layers.53.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -8.67075286805491e-06, "dbits": 1258291200 }, { "dkld": -1.4350656419991059e-05, "dbits": 2516582400 } ] }, { "idx": 321, "layers": [ "model.layers.54.self_attn.q_proj" ], "candidates": [ { "dkld": -6.662916857749085e-05, "dbits": 62914560 }, { "dkld": -6.852005608379806e-05, "dbits": 125829120 } ] }, { "idx": 322, "layers": [ "model.layers.54.self_attn.k_proj", "model.layers.54.self_attn.v_proj" ], "candidates": [ { "dkld": -8.441112004220486e-05, "dbits": 10485760 }, { "dkld": -8.278263267129556e-05, "dbits": 20971520 } ] }, { "idx": 323, "layers": [ "model.layers.54.self_attn.o_proj" ], "candidates": [ { "dkld": 4.339430015534197e-05, "dbits": 62914560 }, { "dkld": 1.2475205585360874e-05, "dbits": 125829120 } ] }, { "idx": 324, "layers": [ "model.layers.54.mlp.shared_experts.gate_proj", "model.layers.54.mlp.shared_experts.up_proj", "model.layers.54.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.3962923549116699e-05, "dbits": 23592960 }, { "dkld": 2.6479153893888344e-05, "dbits": 47185920 } ] }, { "idx": 325, "layers": [ "model.layers.54.mlp.experts.0.gate_proj", "model.layers.54.mlp.experts.1.gate_proj", "model.layers.54.mlp.experts.2.gate_proj", "model.layers.54.mlp.experts.3.gate_proj", "model.layers.54.mlp.experts.4.gate_proj", "model.layers.54.mlp.experts.5.gate_proj", "model.layers.54.mlp.experts.6.gate_proj", "model.layers.54.mlp.experts.7.gate_proj", "model.layers.54.mlp.experts.8.gate_proj", "model.layers.54.mlp.experts.9.gate_proj", "model.layers.54.mlp.experts.10.gate_proj", "model.layers.54.mlp.experts.11.gate_proj", "model.layers.54.mlp.experts.12.gate_proj", "model.layers.54.mlp.experts.13.gate_proj", "model.layers.54.mlp.experts.14.gate_proj", "model.layers.54.mlp.experts.15.gate_proj", "model.layers.54.mlp.experts.16.gate_proj", "model.layers.54.mlp.experts.17.gate_proj", "model.layers.54.mlp.experts.18.gate_proj", "model.layers.54.mlp.experts.19.gate_proj", "model.layers.54.mlp.experts.20.gate_proj", "model.layers.54.mlp.experts.21.gate_proj", "model.layers.54.mlp.experts.22.gate_proj", "model.layers.54.mlp.experts.23.gate_proj", "model.layers.54.mlp.experts.24.gate_proj", "model.layers.54.mlp.experts.25.gate_proj", "model.layers.54.mlp.experts.26.gate_proj", "model.layers.54.mlp.experts.27.gate_proj", "model.layers.54.mlp.experts.28.gate_proj", "model.layers.54.mlp.experts.29.gate_proj", "model.layers.54.mlp.experts.30.gate_proj", "model.layers.54.mlp.experts.31.gate_proj", "model.layers.54.mlp.experts.32.gate_proj", "model.layers.54.mlp.experts.33.gate_proj", "model.layers.54.mlp.experts.34.gate_proj", "model.layers.54.mlp.experts.35.gate_proj", "model.layers.54.mlp.experts.36.gate_proj", "model.layers.54.mlp.experts.37.gate_proj", "model.layers.54.mlp.experts.38.gate_proj", "model.layers.54.mlp.experts.39.gate_proj", "model.layers.54.mlp.experts.40.gate_proj", "model.layers.54.mlp.experts.41.gate_proj", "model.layers.54.mlp.experts.42.gate_proj", "model.layers.54.mlp.experts.43.gate_proj", "model.layers.54.mlp.experts.44.gate_proj", "model.layers.54.mlp.experts.45.gate_proj", "model.layers.54.mlp.experts.46.gate_proj", "model.layers.54.mlp.experts.47.gate_proj", "model.layers.54.mlp.experts.48.gate_proj", "model.layers.54.mlp.experts.49.gate_proj", "model.layers.54.mlp.experts.50.gate_proj", "model.layers.54.mlp.experts.51.gate_proj", "model.layers.54.mlp.experts.52.gate_proj", "model.layers.54.mlp.experts.53.gate_proj", "model.layers.54.mlp.experts.54.gate_proj", "model.layers.54.mlp.experts.55.gate_proj", "model.layers.54.mlp.experts.56.gate_proj", "model.layers.54.mlp.experts.57.gate_proj", "model.layers.54.mlp.experts.58.gate_proj", "model.layers.54.mlp.experts.59.gate_proj", "model.layers.54.mlp.experts.60.gate_proj", "model.layers.54.mlp.experts.61.gate_proj", "model.layers.54.mlp.experts.62.gate_proj", "model.layers.54.mlp.experts.63.gate_proj", "model.layers.54.mlp.experts.64.gate_proj", "model.layers.54.mlp.experts.65.gate_proj", "model.layers.54.mlp.experts.66.gate_proj", "model.layers.54.mlp.experts.67.gate_proj", "model.layers.54.mlp.experts.68.gate_proj", "model.layers.54.mlp.experts.69.gate_proj", "model.layers.54.mlp.experts.70.gate_proj", "model.layers.54.mlp.experts.71.gate_proj", "model.layers.54.mlp.experts.72.gate_proj", "model.layers.54.mlp.experts.73.gate_proj", "model.layers.54.mlp.experts.74.gate_proj", "model.layers.54.mlp.experts.75.gate_proj", "model.layers.54.mlp.experts.76.gate_proj", "model.layers.54.mlp.experts.77.gate_proj", "model.layers.54.mlp.experts.78.gate_proj", "model.layers.54.mlp.experts.79.gate_proj", "model.layers.54.mlp.experts.80.gate_proj", "model.layers.54.mlp.experts.81.gate_proj", "model.layers.54.mlp.experts.82.gate_proj", "model.layers.54.mlp.experts.83.gate_proj", "model.layers.54.mlp.experts.84.gate_proj", "model.layers.54.mlp.experts.85.gate_proj", "model.layers.54.mlp.experts.86.gate_proj", "model.layers.54.mlp.experts.87.gate_proj", "model.layers.54.mlp.experts.88.gate_proj", "model.layers.54.mlp.experts.89.gate_proj", "model.layers.54.mlp.experts.90.gate_proj", "model.layers.54.mlp.experts.91.gate_proj", "model.layers.54.mlp.experts.92.gate_proj", "model.layers.54.mlp.experts.93.gate_proj", "model.layers.54.mlp.experts.94.gate_proj", "model.layers.54.mlp.experts.95.gate_proj", "model.layers.54.mlp.experts.96.gate_proj", "model.layers.54.mlp.experts.97.gate_proj", "model.layers.54.mlp.experts.98.gate_proj", "model.layers.54.mlp.experts.99.gate_proj", "model.layers.54.mlp.experts.100.gate_proj", "model.layers.54.mlp.experts.101.gate_proj", "model.layers.54.mlp.experts.102.gate_proj", "model.layers.54.mlp.experts.103.gate_proj", "model.layers.54.mlp.experts.104.gate_proj", "model.layers.54.mlp.experts.105.gate_proj", "model.layers.54.mlp.experts.106.gate_proj", "model.layers.54.mlp.experts.107.gate_proj", "model.layers.54.mlp.experts.108.gate_proj", "model.layers.54.mlp.experts.109.gate_proj", "model.layers.54.mlp.experts.110.gate_proj", "model.layers.54.mlp.experts.111.gate_proj", "model.layers.54.mlp.experts.112.gate_proj", "model.layers.54.mlp.experts.113.gate_proj", "model.layers.54.mlp.experts.114.gate_proj", "model.layers.54.mlp.experts.115.gate_proj", "model.layers.54.mlp.experts.116.gate_proj", "model.layers.54.mlp.experts.117.gate_proj", "model.layers.54.mlp.experts.118.gate_proj", "model.layers.54.mlp.experts.119.gate_proj", "model.layers.54.mlp.experts.120.gate_proj", "model.layers.54.mlp.experts.121.gate_proj", "model.layers.54.mlp.experts.122.gate_proj", "model.layers.54.mlp.experts.123.gate_proj", "model.layers.54.mlp.experts.124.gate_proj", "model.layers.54.mlp.experts.125.gate_proj", "model.layers.54.mlp.experts.126.gate_proj", "model.layers.54.mlp.experts.127.gate_proj", "model.layers.54.mlp.experts.128.gate_proj", "model.layers.54.mlp.experts.129.gate_proj", "model.layers.54.mlp.experts.130.gate_proj", "model.layers.54.mlp.experts.131.gate_proj", "model.layers.54.mlp.experts.132.gate_proj", "model.layers.54.mlp.experts.133.gate_proj", "model.layers.54.mlp.experts.134.gate_proj", "model.layers.54.mlp.experts.135.gate_proj", "model.layers.54.mlp.experts.136.gate_proj", "model.layers.54.mlp.experts.137.gate_proj", "model.layers.54.mlp.experts.138.gate_proj", "model.layers.54.mlp.experts.139.gate_proj", "model.layers.54.mlp.experts.140.gate_proj", "model.layers.54.mlp.experts.141.gate_proj", "model.layers.54.mlp.experts.142.gate_proj", "model.layers.54.mlp.experts.143.gate_proj", "model.layers.54.mlp.experts.144.gate_proj", "model.layers.54.mlp.experts.145.gate_proj", "model.layers.54.mlp.experts.146.gate_proj", "model.layers.54.mlp.experts.147.gate_proj", "model.layers.54.mlp.experts.148.gate_proj", "model.layers.54.mlp.experts.149.gate_proj", "model.layers.54.mlp.experts.150.gate_proj", "model.layers.54.mlp.experts.151.gate_proj", "model.layers.54.mlp.experts.152.gate_proj", "model.layers.54.mlp.experts.153.gate_proj", "model.layers.54.mlp.experts.154.gate_proj", "model.layers.54.mlp.experts.155.gate_proj", "model.layers.54.mlp.experts.156.gate_proj", "model.layers.54.mlp.experts.157.gate_proj", "model.layers.54.mlp.experts.158.gate_proj", "model.layers.54.mlp.experts.159.gate_proj", "model.layers.54.mlp.experts.0.up_proj", "model.layers.54.mlp.experts.1.up_proj", "model.layers.54.mlp.experts.2.up_proj", "model.layers.54.mlp.experts.3.up_proj", "model.layers.54.mlp.experts.4.up_proj", "model.layers.54.mlp.experts.5.up_proj", "model.layers.54.mlp.experts.6.up_proj", "model.layers.54.mlp.experts.7.up_proj", "model.layers.54.mlp.experts.8.up_proj", "model.layers.54.mlp.experts.9.up_proj", "model.layers.54.mlp.experts.10.up_proj", "model.layers.54.mlp.experts.11.up_proj", "model.layers.54.mlp.experts.12.up_proj", "model.layers.54.mlp.experts.13.up_proj", "model.layers.54.mlp.experts.14.up_proj", "model.layers.54.mlp.experts.15.up_proj", "model.layers.54.mlp.experts.16.up_proj", "model.layers.54.mlp.experts.17.up_proj", "model.layers.54.mlp.experts.18.up_proj", "model.layers.54.mlp.experts.19.up_proj", "model.layers.54.mlp.experts.20.up_proj", "model.layers.54.mlp.experts.21.up_proj", "model.layers.54.mlp.experts.22.up_proj", "model.layers.54.mlp.experts.23.up_proj", "model.layers.54.mlp.experts.24.up_proj", "model.layers.54.mlp.experts.25.up_proj", "model.layers.54.mlp.experts.26.up_proj", "model.layers.54.mlp.experts.27.up_proj", "model.layers.54.mlp.experts.28.up_proj", "model.layers.54.mlp.experts.29.up_proj", "model.layers.54.mlp.experts.30.up_proj", "model.layers.54.mlp.experts.31.up_proj", "model.layers.54.mlp.experts.32.up_proj", "model.layers.54.mlp.experts.33.up_proj", "model.layers.54.mlp.experts.34.up_proj", "model.layers.54.mlp.experts.35.up_proj", "model.layers.54.mlp.experts.36.up_proj", "model.layers.54.mlp.experts.37.up_proj", "model.layers.54.mlp.experts.38.up_proj", "model.layers.54.mlp.experts.39.up_proj", "model.layers.54.mlp.experts.40.up_proj", "model.layers.54.mlp.experts.41.up_proj", "model.layers.54.mlp.experts.42.up_proj", "model.layers.54.mlp.experts.43.up_proj", "model.layers.54.mlp.experts.44.up_proj", "model.layers.54.mlp.experts.45.up_proj", "model.layers.54.mlp.experts.46.up_proj", "model.layers.54.mlp.experts.47.up_proj", "model.layers.54.mlp.experts.48.up_proj", "model.layers.54.mlp.experts.49.up_proj", "model.layers.54.mlp.experts.50.up_proj", "model.layers.54.mlp.experts.51.up_proj", "model.layers.54.mlp.experts.52.up_proj", "model.layers.54.mlp.experts.53.up_proj", "model.layers.54.mlp.experts.54.up_proj", "model.layers.54.mlp.experts.55.up_proj", "model.layers.54.mlp.experts.56.up_proj", "model.layers.54.mlp.experts.57.up_proj", "model.layers.54.mlp.experts.58.up_proj", "model.layers.54.mlp.experts.59.up_proj", "model.layers.54.mlp.experts.60.up_proj", "model.layers.54.mlp.experts.61.up_proj", "model.layers.54.mlp.experts.62.up_proj", "model.layers.54.mlp.experts.63.up_proj", "model.layers.54.mlp.experts.64.up_proj", "model.layers.54.mlp.experts.65.up_proj", "model.layers.54.mlp.experts.66.up_proj", "model.layers.54.mlp.experts.67.up_proj", "model.layers.54.mlp.experts.68.up_proj", "model.layers.54.mlp.experts.69.up_proj", "model.layers.54.mlp.experts.70.up_proj", "model.layers.54.mlp.experts.71.up_proj", "model.layers.54.mlp.experts.72.up_proj", "model.layers.54.mlp.experts.73.up_proj", "model.layers.54.mlp.experts.74.up_proj", "model.layers.54.mlp.experts.75.up_proj", "model.layers.54.mlp.experts.76.up_proj", "model.layers.54.mlp.experts.77.up_proj", "model.layers.54.mlp.experts.78.up_proj", "model.layers.54.mlp.experts.79.up_proj", "model.layers.54.mlp.experts.80.up_proj", "model.layers.54.mlp.experts.81.up_proj", "model.layers.54.mlp.experts.82.up_proj", "model.layers.54.mlp.experts.83.up_proj", "model.layers.54.mlp.experts.84.up_proj", "model.layers.54.mlp.experts.85.up_proj", "model.layers.54.mlp.experts.86.up_proj", "model.layers.54.mlp.experts.87.up_proj", "model.layers.54.mlp.experts.88.up_proj", "model.layers.54.mlp.experts.89.up_proj", "model.layers.54.mlp.experts.90.up_proj", "model.layers.54.mlp.experts.91.up_proj", "model.layers.54.mlp.experts.92.up_proj", "model.layers.54.mlp.experts.93.up_proj", "model.layers.54.mlp.experts.94.up_proj", "model.layers.54.mlp.experts.95.up_proj", "model.layers.54.mlp.experts.96.up_proj", "model.layers.54.mlp.experts.97.up_proj", "model.layers.54.mlp.experts.98.up_proj", "model.layers.54.mlp.experts.99.up_proj", "model.layers.54.mlp.experts.100.up_proj", "model.layers.54.mlp.experts.101.up_proj", "model.layers.54.mlp.experts.102.up_proj", "model.layers.54.mlp.experts.103.up_proj", "model.layers.54.mlp.experts.104.up_proj", "model.layers.54.mlp.experts.105.up_proj", "model.layers.54.mlp.experts.106.up_proj", "model.layers.54.mlp.experts.107.up_proj", "model.layers.54.mlp.experts.108.up_proj", "model.layers.54.mlp.experts.109.up_proj", "model.layers.54.mlp.experts.110.up_proj", "model.layers.54.mlp.experts.111.up_proj", "model.layers.54.mlp.experts.112.up_proj", "model.layers.54.mlp.experts.113.up_proj", "model.layers.54.mlp.experts.114.up_proj", "model.layers.54.mlp.experts.115.up_proj", "model.layers.54.mlp.experts.116.up_proj", "model.layers.54.mlp.experts.117.up_proj", "model.layers.54.mlp.experts.118.up_proj", "model.layers.54.mlp.experts.119.up_proj", "model.layers.54.mlp.experts.120.up_proj", "model.layers.54.mlp.experts.121.up_proj", "model.layers.54.mlp.experts.122.up_proj", "model.layers.54.mlp.experts.123.up_proj", "model.layers.54.mlp.experts.124.up_proj", "model.layers.54.mlp.experts.125.up_proj", "model.layers.54.mlp.experts.126.up_proj", "model.layers.54.mlp.experts.127.up_proj", "model.layers.54.mlp.experts.128.up_proj", "model.layers.54.mlp.experts.129.up_proj", "model.layers.54.mlp.experts.130.up_proj", "model.layers.54.mlp.experts.131.up_proj", "model.layers.54.mlp.experts.132.up_proj", "model.layers.54.mlp.experts.133.up_proj", "model.layers.54.mlp.experts.134.up_proj", "model.layers.54.mlp.experts.135.up_proj", "model.layers.54.mlp.experts.136.up_proj", "model.layers.54.mlp.experts.137.up_proj", "model.layers.54.mlp.experts.138.up_proj", "model.layers.54.mlp.experts.139.up_proj", "model.layers.54.mlp.experts.140.up_proj", "model.layers.54.mlp.experts.141.up_proj", "model.layers.54.mlp.experts.142.up_proj", "model.layers.54.mlp.experts.143.up_proj", "model.layers.54.mlp.experts.144.up_proj", "model.layers.54.mlp.experts.145.up_proj", "model.layers.54.mlp.experts.146.up_proj", "model.layers.54.mlp.experts.147.up_proj", "model.layers.54.mlp.experts.148.up_proj", "model.layers.54.mlp.experts.149.up_proj", "model.layers.54.mlp.experts.150.up_proj", "model.layers.54.mlp.experts.151.up_proj", "model.layers.54.mlp.experts.152.up_proj", "model.layers.54.mlp.experts.153.up_proj", "model.layers.54.mlp.experts.154.up_proj", "model.layers.54.mlp.experts.155.up_proj", "model.layers.54.mlp.experts.156.up_proj", "model.layers.54.mlp.experts.157.up_proj", "model.layers.54.mlp.experts.158.up_proj", "model.layers.54.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.275134652852665e-06, "dbits": 2516582400 }, { "dkld": -4.262872971593987e-06, "dbits": 5033164800 } ] }, { "idx": 326, "layers": [ "model.layers.54.mlp.experts.0.down_proj", "model.layers.54.mlp.experts.1.down_proj", "model.layers.54.mlp.experts.2.down_proj", "model.layers.54.mlp.experts.3.down_proj", "model.layers.54.mlp.experts.4.down_proj", "model.layers.54.mlp.experts.5.down_proj", "model.layers.54.mlp.experts.6.down_proj", "model.layers.54.mlp.experts.7.down_proj", "model.layers.54.mlp.experts.8.down_proj", "model.layers.54.mlp.experts.9.down_proj", "model.layers.54.mlp.experts.10.down_proj", "model.layers.54.mlp.experts.11.down_proj", "model.layers.54.mlp.experts.12.down_proj", "model.layers.54.mlp.experts.13.down_proj", "model.layers.54.mlp.experts.14.down_proj", "model.layers.54.mlp.experts.15.down_proj", "model.layers.54.mlp.experts.16.down_proj", "model.layers.54.mlp.experts.17.down_proj", "model.layers.54.mlp.experts.18.down_proj", "model.layers.54.mlp.experts.19.down_proj", "model.layers.54.mlp.experts.20.down_proj", "model.layers.54.mlp.experts.21.down_proj", "model.layers.54.mlp.experts.22.down_proj", "model.layers.54.mlp.experts.23.down_proj", "model.layers.54.mlp.experts.24.down_proj", "model.layers.54.mlp.experts.25.down_proj", "model.layers.54.mlp.experts.26.down_proj", "model.layers.54.mlp.experts.27.down_proj", "model.layers.54.mlp.experts.28.down_proj", "model.layers.54.mlp.experts.29.down_proj", "model.layers.54.mlp.experts.30.down_proj", "model.layers.54.mlp.experts.31.down_proj", "model.layers.54.mlp.experts.32.down_proj", "model.layers.54.mlp.experts.33.down_proj", "model.layers.54.mlp.experts.34.down_proj", "model.layers.54.mlp.experts.35.down_proj", "model.layers.54.mlp.experts.36.down_proj", "model.layers.54.mlp.experts.37.down_proj", "model.layers.54.mlp.experts.38.down_proj", "model.layers.54.mlp.experts.39.down_proj", "model.layers.54.mlp.experts.40.down_proj", "model.layers.54.mlp.experts.41.down_proj", "model.layers.54.mlp.experts.42.down_proj", "model.layers.54.mlp.experts.43.down_proj", "model.layers.54.mlp.experts.44.down_proj", "model.layers.54.mlp.experts.45.down_proj", "model.layers.54.mlp.experts.46.down_proj", "model.layers.54.mlp.experts.47.down_proj", "model.layers.54.mlp.experts.48.down_proj", "model.layers.54.mlp.experts.49.down_proj", "model.layers.54.mlp.experts.50.down_proj", "model.layers.54.mlp.experts.51.down_proj", "model.layers.54.mlp.experts.52.down_proj", "model.layers.54.mlp.experts.53.down_proj", "model.layers.54.mlp.experts.54.down_proj", "model.layers.54.mlp.experts.55.down_proj", "model.layers.54.mlp.experts.56.down_proj", "model.layers.54.mlp.experts.57.down_proj", "model.layers.54.mlp.experts.58.down_proj", "model.layers.54.mlp.experts.59.down_proj", "model.layers.54.mlp.experts.60.down_proj", "model.layers.54.mlp.experts.61.down_proj", "model.layers.54.mlp.experts.62.down_proj", "model.layers.54.mlp.experts.63.down_proj", "model.layers.54.mlp.experts.64.down_proj", "model.layers.54.mlp.experts.65.down_proj", "model.layers.54.mlp.experts.66.down_proj", "model.layers.54.mlp.experts.67.down_proj", "model.layers.54.mlp.experts.68.down_proj", "model.layers.54.mlp.experts.69.down_proj", "model.layers.54.mlp.experts.70.down_proj", "model.layers.54.mlp.experts.71.down_proj", "model.layers.54.mlp.experts.72.down_proj", "model.layers.54.mlp.experts.73.down_proj", "model.layers.54.mlp.experts.74.down_proj", "model.layers.54.mlp.experts.75.down_proj", "model.layers.54.mlp.experts.76.down_proj", "model.layers.54.mlp.experts.77.down_proj", "model.layers.54.mlp.experts.78.down_proj", "model.layers.54.mlp.experts.79.down_proj", "model.layers.54.mlp.experts.80.down_proj", "model.layers.54.mlp.experts.81.down_proj", "model.layers.54.mlp.experts.82.down_proj", "model.layers.54.mlp.experts.83.down_proj", "model.layers.54.mlp.experts.84.down_proj", "model.layers.54.mlp.experts.85.down_proj", "model.layers.54.mlp.experts.86.down_proj", "model.layers.54.mlp.experts.87.down_proj", "model.layers.54.mlp.experts.88.down_proj", "model.layers.54.mlp.experts.89.down_proj", "model.layers.54.mlp.experts.90.down_proj", "model.layers.54.mlp.experts.91.down_proj", "model.layers.54.mlp.experts.92.down_proj", "model.layers.54.mlp.experts.93.down_proj", "model.layers.54.mlp.experts.94.down_proj", "model.layers.54.mlp.experts.95.down_proj", "model.layers.54.mlp.experts.96.down_proj", "model.layers.54.mlp.experts.97.down_proj", "model.layers.54.mlp.experts.98.down_proj", "model.layers.54.mlp.experts.99.down_proj", "model.layers.54.mlp.experts.100.down_proj", "model.layers.54.mlp.experts.101.down_proj", "model.layers.54.mlp.experts.102.down_proj", "model.layers.54.mlp.experts.103.down_proj", "model.layers.54.mlp.experts.104.down_proj", "model.layers.54.mlp.experts.105.down_proj", "model.layers.54.mlp.experts.106.down_proj", "model.layers.54.mlp.experts.107.down_proj", "model.layers.54.mlp.experts.108.down_proj", "model.layers.54.mlp.experts.109.down_proj", "model.layers.54.mlp.experts.110.down_proj", "model.layers.54.mlp.experts.111.down_proj", "model.layers.54.mlp.experts.112.down_proj", "model.layers.54.mlp.experts.113.down_proj", "model.layers.54.mlp.experts.114.down_proj", "model.layers.54.mlp.experts.115.down_proj", "model.layers.54.mlp.experts.116.down_proj", "model.layers.54.mlp.experts.117.down_proj", "model.layers.54.mlp.experts.118.down_proj", "model.layers.54.mlp.experts.119.down_proj", "model.layers.54.mlp.experts.120.down_proj", "model.layers.54.mlp.experts.121.down_proj", "model.layers.54.mlp.experts.122.down_proj", "model.layers.54.mlp.experts.123.down_proj", "model.layers.54.mlp.experts.124.down_proj", "model.layers.54.mlp.experts.125.down_proj", "model.layers.54.mlp.experts.126.down_proj", "model.layers.54.mlp.experts.127.down_proj", "model.layers.54.mlp.experts.128.down_proj", "model.layers.54.mlp.experts.129.down_proj", "model.layers.54.mlp.experts.130.down_proj", "model.layers.54.mlp.experts.131.down_proj", "model.layers.54.mlp.experts.132.down_proj", "model.layers.54.mlp.experts.133.down_proj", "model.layers.54.mlp.experts.134.down_proj", "model.layers.54.mlp.experts.135.down_proj", "model.layers.54.mlp.experts.136.down_proj", "model.layers.54.mlp.experts.137.down_proj", "model.layers.54.mlp.experts.138.down_proj", "model.layers.54.mlp.experts.139.down_proj", "model.layers.54.mlp.experts.140.down_proj", "model.layers.54.mlp.experts.141.down_proj", "model.layers.54.mlp.experts.142.down_proj", "model.layers.54.mlp.experts.143.down_proj", "model.layers.54.mlp.experts.144.down_proj", "model.layers.54.mlp.experts.145.down_proj", "model.layers.54.mlp.experts.146.down_proj", "model.layers.54.mlp.experts.147.down_proj", "model.layers.54.mlp.experts.148.down_proj", "model.layers.54.mlp.experts.149.down_proj", "model.layers.54.mlp.experts.150.down_proj", "model.layers.54.mlp.experts.151.down_proj", "model.layers.54.mlp.experts.152.down_proj", "model.layers.54.mlp.experts.153.down_proj", "model.layers.54.mlp.experts.154.down_proj", "model.layers.54.mlp.experts.155.down_proj", "model.layers.54.mlp.experts.156.down_proj", "model.layers.54.mlp.experts.157.down_proj", "model.layers.54.mlp.experts.158.down_proj", "model.layers.54.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.6568304747204285e-07, "dbits": 1258291200 }, { "dkld": 1.2503541074694244e-05, "dbits": 2516582400 } ] }, { "idx": 327, "layers": [ "model.layers.55.self_attn.q_proj" ], "candidates": [ { "dkld": 3.9264233782887806e-05, "dbits": 62914560 }, { "dkld": 3.398982807993958e-05, "dbits": 125829120 } ] }, { "idx": 328, "layers": [ "model.layers.55.self_attn.k_proj", "model.layers.55.self_attn.v_proj" ], "candidates": [ { "dkld": 5.102967843413457e-05, "dbits": 10485760 }, { "dkld": 6.161124911159381e-05, "dbits": 20971520 } ] }, { "idx": 329, "layers": [ "model.layers.55.self_attn.o_proj" ], "candidates": [ { "dkld": -9.875139221548687e-06, "dbits": 62914560 }, { "dkld": -1.1104159057129942e-06, "dbits": 125829120 } ] }, { "idx": 330, "layers": [ "model.layers.55.mlp.shared_experts.gate_proj", "model.layers.55.mlp.shared_experts.up_proj", "model.layers.55.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.4512736126780163e-05, "dbits": 23592960 }, { "dkld": -1.1996645480393323e-05, "dbits": 47185920 } ] }, { "idx": 331, "layers": [ "model.layers.55.mlp.experts.0.gate_proj", "model.layers.55.mlp.experts.1.gate_proj", "model.layers.55.mlp.experts.2.gate_proj", "model.layers.55.mlp.experts.3.gate_proj", "model.layers.55.mlp.experts.4.gate_proj", "model.layers.55.mlp.experts.5.gate_proj", "model.layers.55.mlp.experts.6.gate_proj", "model.layers.55.mlp.experts.7.gate_proj", "model.layers.55.mlp.experts.8.gate_proj", "model.layers.55.mlp.experts.9.gate_proj", "model.layers.55.mlp.experts.10.gate_proj", "model.layers.55.mlp.experts.11.gate_proj", "model.layers.55.mlp.experts.12.gate_proj", "model.layers.55.mlp.experts.13.gate_proj", "model.layers.55.mlp.experts.14.gate_proj", "model.layers.55.mlp.experts.15.gate_proj", "model.layers.55.mlp.experts.16.gate_proj", "model.layers.55.mlp.experts.17.gate_proj", "model.layers.55.mlp.experts.18.gate_proj", "model.layers.55.mlp.experts.19.gate_proj", "model.layers.55.mlp.experts.20.gate_proj", "model.layers.55.mlp.experts.21.gate_proj", "model.layers.55.mlp.experts.22.gate_proj", "model.layers.55.mlp.experts.23.gate_proj", "model.layers.55.mlp.experts.24.gate_proj", "model.layers.55.mlp.experts.25.gate_proj", "model.layers.55.mlp.experts.26.gate_proj", "model.layers.55.mlp.experts.27.gate_proj", "model.layers.55.mlp.experts.28.gate_proj", "model.layers.55.mlp.experts.29.gate_proj", "model.layers.55.mlp.experts.30.gate_proj", "model.layers.55.mlp.experts.31.gate_proj", "model.layers.55.mlp.experts.32.gate_proj", "model.layers.55.mlp.experts.33.gate_proj", "model.layers.55.mlp.experts.34.gate_proj", "model.layers.55.mlp.experts.35.gate_proj", "model.layers.55.mlp.experts.36.gate_proj", "model.layers.55.mlp.experts.37.gate_proj", "model.layers.55.mlp.experts.38.gate_proj", "model.layers.55.mlp.experts.39.gate_proj", "model.layers.55.mlp.experts.40.gate_proj", "model.layers.55.mlp.experts.41.gate_proj", "model.layers.55.mlp.experts.42.gate_proj", "model.layers.55.mlp.experts.43.gate_proj", "model.layers.55.mlp.experts.44.gate_proj", "model.layers.55.mlp.experts.45.gate_proj", "model.layers.55.mlp.experts.46.gate_proj", "model.layers.55.mlp.experts.47.gate_proj", "model.layers.55.mlp.experts.48.gate_proj", "model.layers.55.mlp.experts.49.gate_proj", "model.layers.55.mlp.experts.50.gate_proj", "model.layers.55.mlp.experts.51.gate_proj", "model.layers.55.mlp.experts.52.gate_proj", "model.layers.55.mlp.experts.53.gate_proj", "model.layers.55.mlp.experts.54.gate_proj", "model.layers.55.mlp.experts.55.gate_proj", "model.layers.55.mlp.experts.56.gate_proj", "model.layers.55.mlp.experts.57.gate_proj", "model.layers.55.mlp.experts.58.gate_proj", "model.layers.55.mlp.experts.59.gate_proj", "model.layers.55.mlp.experts.60.gate_proj", "model.layers.55.mlp.experts.61.gate_proj", "model.layers.55.mlp.experts.62.gate_proj", "model.layers.55.mlp.experts.63.gate_proj", "model.layers.55.mlp.experts.64.gate_proj", "model.layers.55.mlp.experts.65.gate_proj", "model.layers.55.mlp.experts.66.gate_proj", "model.layers.55.mlp.experts.67.gate_proj", "model.layers.55.mlp.experts.68.gate_proj", "model.layers.55.mlp.experts.69.gate_proj", "model.layers.55.mlp.experts.70.gate_proj", "model.layers.55.mlp.experts.71.gate_proj", "model.layers.55.mlp.experts.72.gate_proj", "model.layers.55.mlp.experts.73.gate_proj", "model.layers.55.mlp.experts.74.gate_proj", "model.layers.55.mlp.experts.75.gate_proj", "model.layers.55.mlp.experts.76.gate_proj", "model.layers.55.mlp.experts.77.gate_proj", "model.layers.55.mlp.experts.78.gate_proj", "model.layers.55.mlp.experts.79.gate_proj", "model.layers.55.mlp.experts.80.gate_proj", "model.layers.55.mlp.experts.81.gate_proj", "model.layers.55.mlp.experts.82.gate_proj", "model.layers.55.mlp.experts.83.gate_proj", "model.layers.55.mlp.experts.84.gate_proj", "model.layers.55.mlp.experts.85.gate_proj", "model.layers.55.mlp.experts.86.gate_proj", "model.layers.55.mlp.experts.87.gate_proj", "model.layers.55.mlp.experts.88.gate_proj", "model.layers.55.mlp.experts.89.gate_proj", "model.layers.55.mlp.experts.90.gate_proj", "model.layers.55.mlp.experts.91.gate_proj", "model.layers.55.mlp.experts.92.gate_proj", "model.layers.55.mlp.experts.93.gate_proj", "model.layers.55.mlp.experts.94.gate_proj", "model.layers.55.mlp.experts.95.gate_proj", "model.layers.55.mlp.experts.96.gate_proj", "model.layers.55.mlp.experts.97.gate_proj", "model.layers.55.mlp.experts.98.gate_proj", "model.layers.55.mlp.experts.99.gate_proj", "model.layers.55.mlp.experts.100.gate_proj", "model.layers.55.mlp.experts.101.gate_proj", "model.layers.55.mlp.experts.102.gate_proj", "model.layers.55.mlp.experts.103.gate_proj", "model.layers.55.mlp.experts.104.gate_proj", "model.layers.55.mlp.experts.105.gate_proj", "model.layers.55.mlp.experts.106.gate_proj", "model.layers.55.mlp.experts.107.gate_proj", "model.layers.55.mlp.experts.108.gate_proj", "model.layers.55.mlp.experts.109.gate_proj", "model.layers.55.mlp.experts.110.gate_proj", "model.layers.55.mlp.experts.111.gate_proj", "model.layers.55.mlp.experts.112.gate_proj", "model.layers.55.mlp.experts.113.gate_proj", "model.layers.55.mlp.experts.114.gate_proj", "model.layers.55.mlp.experts.115.gate_proj", "model.layers.55.mlp.experts.116.gate_proj", "model.layers.55.mlp.experts.117.gate_proj", "model.layers.55.mlp.experts.118.gate_proj", "model.layers.55.mlp.experts.119.gate_proj", "model.layers.55.mlp.experts.120.gate_proj", "model.layers.55.mlp.experts.121.gate_proj", "model.layers.55.mlp.experts.122.gate_proj", "model.layers.55.mlp.experts.123.gate_proj", "model.layers.55.mlp.experts.124.gate_proj", "model.layers.55.mlp.experts.125.gate_proj", "model.layers.55.mlp.experts.126.gate_proj", "model.layers.55.mlp.experts.127.gate_proj", "model.layers.55.mlp.experts.128.gate_proj", "model.layers.55.mlp.experts.129.gate_proj", "model.layers.55.mlp.experts.130.gate_proj", "model.layers.55.mlp.experts.131.gate_proj", "model.layers.55.mlp.experts.132.gate_proj", "model.layers.55.mlp.experts.133.gate_proj", "model.layers.55.mlp.experts.134.gate_proj", "model.layers.55.mlp.experts.135.gate_proj", "model.layers.55.mlp.experts.136.gate_proj", "model.layers.55.mlp.experts.137.gate_proj", "model.layers.55.mlp.experts.138.gate_proj", "model.layers.55.mlp.experts.139.gate_proj", "model.layers.55.mlp.experts.140.gate_proj", "model.layers.55.mlp.experts.141.gate_proj", "model.layers.55.mlp.experts.142.gate_proj", "model.layers.55.mlp.experts.143.gate_proj", "model.layers.55.mlp.experts.144.gate_proj", "model.layers.55.mlp.experts.145.gate_proj", "model.layers.55.mlp.experts.146.gate_proj", "model.layers.55.mlp.experts.147.gate_proj", "model.layers.55.mlp.experts.148.gate_proj", "model.layers.55.mlp.experts.149.gate_proj", "model.layers.55.mlp.experts.150.gate_proj", "model.layers.55.mlp.experts.151.gate_proj", "model.layers.55.mlp.experts.152.gate_proj", "model.layers.55.mlp.experts.153.gate_proj", "model.layers.55.mlp.experts.154.gate_proj", "model.layers.55.mlp.experts.155.gate_proj", "model.layers.55.mlp.experts.156.gate_proj", "model.layers.55.mlp.experts.157.gate_proj", "model.layers.55.mlp.experts.158.gate_proj", "model.layers.55.mlp.experts.159.gate_proj", "model.layers.55.mlp.experts.0.up_proj", "model.layers.55.mlp.experts.1.up_proj", "model.layers.55.mlp.experts.2.up_proj", "model.layers.55.mlp.experts.3.up_proj", "model.layers.55.mlp.experts.4.up_proj", "model.layers.55.mlp.experts.5.up_proj", "model.layers.55.mlp.experts.6.up_proj", "model.layers.55.mlp.experts.7.up_proj", "model.layers.55.mlp.experts.8.up_proj", "model.layers.55.mlp.experts.9.up_proj", "model.layers.55.mlp.experts.10.up_proj", "model.layers.55.mlp.experts.11.up_proj", "model.layers.55.mlp.experts.12.up_proj", "model.layers.55.mlp.experts.13.up_proj", "model.layers.55.mlp.experts.14.up_proj", "model.layers.55.mlp.experts.15.up_proj", "model.layers.55.mlp.experts.16.up_proj", "model.layers.55.mlp.experts.17.up_proj", "model.layers.55.mlp.experts.18.up_proj", "model.layers.55.mlp.experts.19.up_proj", "model.layers.55.mlp.experts.20.up_proj", "model.layers.55.mlp.experts.21.up_proj", "model.layers.55.mlp.experts.22.up_proj", "model.layers.55.mlp.experts.23.up_proj", "model.layers.55.mlp.experts.24.up_proj", "model.layers.55.mlp.experts.25.up_proj", "model.layers.55.mlp.experts.26.up_proj", "model.layers.55.mlp.experts.27.up_proj", "model.layers.55.mlp.experts.28.up_proj", "model.layers.55.mlp.experts.29.up_proj", "model.layers.55.mlp.experts.30.up_proj", "model.layers.55.mlp.experts.31.up_proj", "model.layers.55.mlp.experts.32.up_proj", "model.layers.55.mlp.experts.33.up_proj", "model.layers.55.mlp.experts.34.up_proj", "model.layers.55.mlp.experts.35.up_proj", "model.layers.55.mlp.experts.36.up_proj", "model.layers.55.mlp.experts.37.up_proj", "model.layers.55.mlp.experts.38.up_proj", "model.layers.55.mlp.experts.39.up_proj", "model.layers.55.mlp.experts.40.up_proj", "model.layers.55.mlp.experts.41.up_proj", "model.layers.55.mlp.experts.42.up_proj", "model.layers.55.mlp.experts.43.up_proj", "model.layers.55.mlp.experts.44.up_proj", "model.layers.55.mlp.experts.45.up_proj", "model.layers.55.mlp.experts.46.up_proj", "model.layers.55.mlp.experts.47.up_proj", "model.layers.55.mlp.experts.48.up_proj", "model.layers.55.mlp.experts.49.up_proj", "model.layers.55.mlp.experts.50.up_proj", "model.layers.55.mlp.experts.51.up_proj", "model.layers.55.mlp.experts.52.up_proj", "model.layers.55.mlp.experts.53.up_proj", "model.layers.55.mlp.experts.54.up_proj", "model.layers.55.mlp.experts.55.up_proj", "model.layers.55.mlp.experts.56.up_proj", "model.layers.55.mlp.experts.57.up_proj", "model.layers.55.mlp.experts.58.up_proj", "model.layers.55.mlp.experts.59.up_proj", "model.layers.55.mlp.experts.60.up_proj", "model.layers.55.mlp.experts.61.up_proj", "model.layers.55.mlp.experts.62.up_proj", "model.layers.55.mlp.experts.63.up_proj", "model.layers.55.mlp.experts.64.up_proj", "model.layers.55.mlp.experts.65.up_proj", "model.layers.55.mlp.experts.66.up_proj", "model.layers.55.mlp.experts.67.up_proj", "model.layers.55.mlp.experts.68.up_proj", "model.layers.55.mlp.experts.69.up_proj", "model.layers.55.mlp.experts.70.up_proj", "model.layers.55.mlp.experts.71.up_proj", "model.layers.55.mlp.experts.72.up_proj", "model.layers.55.mlp.experts.73.up_proj", "model.layers.55.mlp.experts.74.up_proj", "model.layers.55.mlp.experts.75.up_proj", "model.layers.55.mlp.experts.76.up_proj", "model.layers.55.mlp.experts.77.up_proj", "model.layers.55.mlp.experts.78.up_proj", "model.layers.55.mlp.experts.79.up_proj", "model.layers.55.mlp.experts.80.up_proj", "model.layers.55.mlp.experts.81.up_proj", "model.layers.55.mlp.experts.82.up_proj", "model.layers.55.mlp.experts.83.up_proj", "model.layers.55.mlp.experts.84.up_proj", "model.layers.55.mlp.experts.85.up_proj", "model.layers.55.mlp.experts.86.up_proj", "model.layers.55.mlp.experts.87.up_proj", "model.layers.55.mlp.experts.88.up_proj", "model.layers.55.mlp.experts.89.up_proj", "model.layers.55.mlp.experts.90.up_proj", "model.layers.55.mlp.experts.91.up_proj", "model.layers.55.mlp.experts.92.up_proj", "model.layers.55.mlp.experts.93.up_proj", "model.layers.55.mlp.experts.94.up_proj", "model.layers.55.mlp.experts.95.up_proj", "model.layers.55.mlp.experts.96.up_proj", "model.layers.55.mlp.experts.97.up_proj", "model.layers.55.mlp.experts.98.up_proj", "model.layers.55.mlp.experts.99.up_proj", "model.layers.55.mlp.experts.100.up_proj", "model.layers.55.mlp.experts.101.up_proj", "model.layers.55.mlp.experts.102.up_proj", "model.layers.55.mlp.experts.103.up_proj", "model.layers.55.mlp.experts.104.up_proj", "model.layers.55.mlp.experts.105.up_proj", "model.layers.55.mlp.experts.106.up_proj", "model.layers.55.mlp.experts.107.up_proj", "model.layers.55.mlp.experts.108.up_proj", "model.layers.55.mlp.experts.109.up_proj", "model.layers.55.mlp.experts.110.up_proj", "model.layers.55.mlp.experts.111.up_proj", "model.layers.55.mlp.experts.112.up_proj", "model.layers.55.mlp.experts.113.up_proj", "model.layers.55.mlp.experts.114.up_proj", "model.layers.55.mlp.experts.115.up_proj", "model.layers.55.mlp.experts.116.up_proj", "model.layers.55.mlp.experts.117.up_proj", "model.layers.55.mlp.experts.118.up_proj", "model.layers.55.mlp.experts.119.up_proj", "model.layers.55.mlp.experts.120.up_proj", "model.layers.55.mlp.experts.121.up_proj", "model.layers.55.mlp.experts.122.up_proj", "model.layers.55.mlp.experts.123.up_proj", "model.layers.55.mlp.experts.124.up_proj", "model.layers.55.mlp.experts.125.up_proj", "model.layers.55.mlp.experts.126.up_proj", "model.layers.55.mlp.experts.127.up_proj", "model.layers.55.mlp.experts.128.up_proj", "model.layers.55.mlp.experts.129.up_proj", "model.layers.55.mlp.experts.130.up_proj", "model.layers.55.mlp.experts.131.up_proj", "model.layers.55.mlp.experts.132.up_proj", "model.layers.55.mlp.experts.133.up_proj", "model.layers.55.mlp.experts.134.up_proj", "model.layers.55.mlp.experts.135.up_proj", "model.layers.55.mlp.experts.136.up_proj", "model.layers.55.mlp.experts.137.up_proj", "model.layers.55.mlp.experts.138.up_proj", "model.layers.55.mlp.experts.139.up_proj", "model.layers.55.mlp.experts.140.up_proj", "model.layers.55.mlp.experts.141.up_proj", "model.layers.55.mlp.experts.142.up_proj", "model.layers.55.mlp.experts.143.up_proj", "model.layers.55.mlp.experts.144.up_proj", "model.layers.55.mlp.experts.145.up_proj", "model.layers.55.mlp.experts.146.up_proj", "model.layers.55.mlp.experts.147.up_proj", "model.layers.55.mlp.experts.148.up_proj", "model.layers.55.mlp.experts.149.up_proj", "model.layers.55.mlp.experts.150.up_proj", "model.layers.55.mlp.experts.151.up_proj", "model.layers.55.mlp.experts.152.up_proj", "model.layers.55.mlp.experts.153.up_proj", "model.layers.55.mlp.experts.154.up_proj", "model.layers.55.mlp.experts.155.up_proj", "model.layers.55.mlp.experts.156.up_proj", "model.layers.55.mlp.experts.157.up_proj", "model.layers.55.mlp.experts.158.up_proj", "model.layers.55.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.0062218643724571e-05, "dbits": 2516582400 }, { "dkld": -2.2132345475255402e-05, "dbits": 5033164800 } ] }, { "idx": 332, "layers": [ "model.layers.55.mlp.experts.0.down_proj", "model.layers.55.mlp.experts.1.down_proj", "model.layers.55.mlp.experts.2.down_proj", "model.layers.55.mlp.experts.3.down_proj", "model.layers.55.mlp.experts.4.down_proj", "model.layers.55.mlp.experts.5.down_proj", "model.layers.55.mlp.experts.6.down_proj", "model.layers.55.mlp.experts.7.down_proj", "model.layers.55.mlp.experts.8.down_proj", "model.layers.55.mlp.experts.9.down_proj", "model.layers.55.mlp.experts.10.down_proj", "model.layers.55.mlp.experts.11.down_proj", "model.layers.55.mlp.experts.12.down_proj", "model.layers.55.mlp.experts.13.down_proj", "model.layers.55.mlp.experts.14.down_proj", "model.layers.55.mlp.experts.15.down_proj", "model.layers.55.mlp.experts.16.down_proj", "model.layers.55.mlp.experts.17.down_proj", "model.layers.55.mlp.experts.18.down_proj", "model.layers.55.mlp.experts.19.down_proj", "model.layers.55.mlp.experts.20.down_proj", "model.layers.55.mlp.experts.21.down_proj", "model.layers.55.mlp.experts.22.down_proj", "model.layers.55.mlp.experts.23.down_proj", "model.layers.55.mlp.experts.24.down_proj", "model.layers.55.mlp.experts.25.down_proj", "model.layers.55.mlp.experts.26.down_proj", "model.layers.55.mlp.experts.27.down_proj", "model.layers.55.mlp.experts.28.down_proj", "model.layers.55.mlp.experts.29.down_proj", "model.layers.55.mlp.experts.30.down_proj", "model.layers.55.mlp.experts.31.down_proj", "model.layers.55.mlp.experts.32.down_proj", "model.layers.55.mlp.experts.33.down_proj", "model.layers.55.mlp.experts.34.down_proj", "model.layers.55.mlp.experts.35.down_proj", "model.layers.55.mlp.experts.36.down_proj", "model.layers.55.mlp.experts.37.down_proj", "model.layers.55.mlp.experts.38.down_proj", "model.layers.55.mlp.experts.39.down_proj", "model.layers.55.mlp.experts.40.down_proj", "model.layers.55.mlp.experts.41.down_proj", "model.layers.55.mlp.experts.42.down_proj", "model.layers.55.mlp.experts.43.down_proj", "model.layers.55.mlp.experts.44.down_proj", "model.layers.55.mlp.experts.45.down_proj", "model.layers.55.mlp.experts.46.down_proj", "model.layers.55.mlp.experts.47.down_proj", "model.layers.55.mlp.experts.48.down_proj", "model.layers.55.mlp.experts.49.down_proj", "model.layers.55.mlp.experts.50.down_proj", "model.layers.55.mlp.experts.51.down_proj", "model.layers.55.mlp.experts.52.down_proj", "model.layers.55.mlp.experts.53.down_proj", "model.layers.55.mlp.experts.54.down_proj", "model.layers.55.mlp.experts.55.down_proj", "model.layers.55.mlp.experts.56.down_proj", "model.layers.55.mlp.experts.57.down_proj", "model.layers.55.mlp.experts.58.down_proj", "model.layers.55.mlp.experts.59.down_proj", "model.layers.55.mlp.experts.60.down_proj", "model.layers.55.mlp.experts.61.down_proj", "model.layers.55.mlp.experts.62.down_proj", "model.layers.55.mlp.experts.63.down_proj", "model.layers.55.mlp.experts.64.down_proj", "model.layers.55.mlp.experts.65.down_proj", "model.layers.55.mlp.experts.66.down_proj", "model.layers.55.mlp.experts.67.down_proj", "model.layers.55.mlp.experts.68.down_proj", "model.layers.55.mlp.experts.69.down_proj", "model.layers.55.mlp.experts.70.down_proj", "model.layers.55.mlp.experts.71.down_proj", "model.layers.55.mlp.experts.72.down_proj", "model.layers.55.mlp.experts.73.down_proj", "model.layers.55.mlp.experts.74.down_proj", "model.layers.55.mlp.experts.75.down_proj", "model.layers.55.mlp.experts.76.down_proj", "model.layers.55.mlp.experts.77.down_proj", "model.layers.55.mlp.experts.78.down_proj", "model.layers.55.mlp.experts.79.down_proj", "model.layers.55.mlp.experts.80.down_proj", "model.layers.55.mlp.experts.81.down_proj", "model.layers.55.mlp.experts.82.down_proj", "model.layers.55.mlp.experts.83.down_proj", "model.layers.55.mlp.experts.84.down_proj", "model.layers.55.mlp.experts.85.down_proj", "model.layers.55.mlp.experts.86.down_proj", "model.layers.55.mlp.experts.87.down_proj", "model.layers.55.mlp.experts.88.down_proj", "model.layers.55.mlp.experts.89.down_proj", "model.layers.55.mlp.experts.90.down_proj", "model.layers.55.mlp.experts.91.down_proj", "model.layers.55.mlp.experts.92.down_proj", "model.layers.55.mlp.experts.93.down_proj", "model.layers.55.mlp.experts.94.down_proj", "model.layers.55.mlp.experts.95.down_proj", "model.layers.55.mlp.experts.96.down_proj", "model.layers.55.mlp.experts.97.down_proj", "model.layers.55.mlp.experts.98.down_proj", "model.layers.55.mlp.experts.99.down_proj", "model.layers.55.mlp.experts.100.down_proj", "model.layers.55.mlp.experts.101.down_proj", "model.layers.55.mlp.experts.102.down_proj", "model.layers.55.mlp.experts.103.down_proj", "model.layers.55.mlp.experts.104.down_proj", "model.layers.55.mlp.experts.105.down_proj", "model.layers.55.mlp.experts.106.down_proj", "model.layers.55.mlp.experts.107.down_proj", "model.layers.55.mlp.experts.108.down_proj", "model.layers.55.mlp.experts.109.down_proj", "model.layers.55.mlp.experts.110.down_proj", "model.layers.55.mlp.experts.111.down_proj", "model.layers.55.mlp.experts.112.down_proj", "model.layers.55.mlp.experts.113.down_proj", "model.layers.55.mlp.experts.114.down_proj", "model.layers.55.mlp.experts.115.down_proj", "model.layers.55.mlp.experts.116.down_proj", "model.layers.55.mlp.experts.117.down_proj", "model.layers.55.mlp.experts.118.down_proj", "model.layers.55.mlp.experts.119.down_proj", "model.layers.55.mlp.experts.120.down_proj", "model.layers.55.mlp.experts.121.down_proj", "model.layers.55.mlp.experts.122.down_proj", "model.layers.55.mlp.experts.123.down_proj", "model.layers.55.mlp.experts.124.down_proj", "model.layers.55.mlp.experts.125.down_proj", "model.layers.55.mlp.experts.126.down_proj", "model.layers.55.mlp.experts.127.down_proj", "model.layers.55.mlp.experts.128.down_proj", "model.layers.55.mlp.experts.129.down_proj", "model.layers.55.mlp.experts.130.down_proj", "model.layers.55.mlp.experts.131.down_proj", "model.layers.55.mlp.experts.132.down_proj", "model.layers.55.mlp.experts.133.down_proj", "model.layers.55.mlp.experts.134.down_proj", "model.layers.55.mlp.experts.135.down_proj", "model.layers.55.mlp.experts.136.down_proj", "model.layers.55.mlp.experts.137.down_proj", "model.layers.55.mlp.experts.138.down_proj", "model.layers.55.mlp.experts.139.down_proj", "model.layers.55.mlp.experts.140.down_proj", "model.layers.55.mlp.experts.141.down_proj", "model.layers.55.mlp.experts.142.down_proj", "model.layers.55.mlp.experts.143.down_proj", "model.layers.55.mlp.experts.144.down_proj", "model.layers.55.mlp.experts.145.down_proj", "model.layers.55.mlp.experts.146.down_proj", "model.layers.55.mlp.experts.147.down_proj", "model.layers.55.mlp.experts.148.down_proj", "model.layers.55.mlp.experts.149.down_proj", "model.layers.55.mlp.experts.150.down_proj", "model.layers.55.mlp.experts.151.down_proj", "model.layers.55.mlp.experts.152.down_proj", "model.layers.55.mlp.experts.153.down_proj", "model.layers.55.mlp.experts.154.down_proj", "model.layers.55.mlp.experts.155.down_proj", "model.layers.55.mlp.experts.156.down_proj", "model.layers.55.mlp.experts.157.down_proj", "model.layers.55.mlp.experts.158.down_proj", "model.layers.55.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.8182053938494156e-06, "dbits": 1258291200 }, { "dkld": 4.070182330907432e-06, "dbits": 2516582400 } ] }, { "idx": 333, "layers": [ "model.layers.56.self_attn.q_proj" ], "candidates": [ { "dkld": 7.904390804469932e-06, "dbits": 62914560 }, { "dkld": -5.388213321565541e-06, "dbits": 125829120 } ] }, { "idx": 334, "layers": [ "model.layers.56.self_attn.k_proj", "model.layers.56.self_attn.v_proj" ], "candidates": [ { "dkld": 5.234910640865634e-05, "dbits": 10485760 }, { "dkld": 5.756495520472561e-05, "dbits": 20971520 } ] }, { "idx": 335, "layers": [ "model.layers.56.self_attn.o_proj" ], "candidates": [ { "dkld": 7.741106674076167e-06, "dbits": 62914560 }, { "dkld": 1.1517852544785587e-05, "dbits": 125829120 } ] }, { "idx": 336, "layers": [ "model.layers.56.mlp.shared_experts.gate_proj", "model.layers.56.mlp.shared_experts.up_proj", "model.layers.56.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.5408685430883667e-05, "dbits": 23592960 }, { "dkld": 9.649945423007705e-06, "dbits": 47185920 } ] }, { "idx": 337, "layers": [ "model.layers.56.mlp.experts.0.gate_proj", "model.layers.56.mlp.experts.1.gate_proj", "model.layers.56.mlp.experts.2.gate_proj", "model.layers.56.mlp.experts.3.gate_proj", "model.layers.56.mlp.experts.4.gate_proj", "model.layers.56.mlp.experts.5.gate_proj", "model.layers.56.mlp.experts.6.gate_proj", "model.layers.56.mlp.experts.7.gate_proj", "model.layers.56.mlp.experts.8.gate_proj", "model.layers.56.mlp.experts.9.gate_proj", "model.layers.56.mlp.experts.10.gate_proj", "model.layers.56.mlp.experts.11.gate_proj", "model.layers.56.mlp.experts.12.gate_proj", "model.layers.56.mlp.experts.13.gate_proj", "model.layers.56.mlp.experts.14.gate_proj", "model.layers.56.mlp.experts.15.gate_proj", "model.layers.56.mlp.experts.16.gate_proj", "model.layers.56.mlp.experts.17.gate_proj", "model.layers.56.mlp.experts.18.gate_proj", "model.layers.56.mlp.experts.19.gate_proj", "model.layers.56.mlp.experts.20.gate_proj", "model.layers.56.mlp.experts.21.gate_proj", "model.layers.56.mlp.experts.22.gate_proj", "model.layers.56.mlp.experts.23.gate_proj", "model.layers.56.mlp.experts.24.gate_proj", "model.layers.56.mlp.experts.25.gate_proj", "model.layers.56.mlp.experts.26.gate_proj", "model.layers.56.mlp.experts.27.gate_proj", "model.layers.56.mlp.experts.28.gate_proj", "model.layers.56.mlp.experts.29.gate_proj", "model.layers.56.mlp.experts.30.gate_proj", "model.layers.56.mlp.experts.31.gate_proj", "model.layers.56.mlp.experts.32.gate_proj", "model.layers.56.mlp.experts.33.gate_proj", "model.layers.56.mlp.experts.34.gate_proj", "model.layers.56.mlp.experts.35.gate_proj", "model.layers.56.mlp.experts.36.gate_proj", "model.layers.56.mlp.experts.37.gate_proj", "model.layers.56.mlp.experts.38.gate_proj", "model.layers.56.mlp.experts.39.gate_proj", "model.layers.56.mlp.experts.40.gate_proj", "model.layers.56.mlp.experts.41.gate_proj", "model.layers.56.mlp.experts.42.gate_proj", "model.layers.56.mlp.experts.43.gate_proj", "model.layers.56.mlp.experts.44.gate_proj", "model.layers.56.mlp.experts.45.gate_proj", "model.layers.56.mlp.experts.46.gate_proj", "model.layers.56.mlp.experts.47.gate_proj", "model.layers.56.mlp.experts.48.gate_proj", "model.layers.56.mlp.experts.49.gate_proj", "model.layers.56.mlp.experts.50.gate_proj", "model.layers.56.mlp.experts.51.gate_proj", "model.layers.56.mlp.experts.52.gate_proj", "model.layers.56.mlp.experts.53.gate_proj", "model.layers.56.mlp.experts.54.gate_proj", "model.layers.56.mlp.experts.55.gate_proj", "model.layers.56.mlp.experts.56.gate_proj", "model.layers.56.mlp.experts.57.gate_proj", "model.layers.56.mlp.experts.58.gate_proj", "model.layers.56.mlp.experts.59.gate_proj", "model.layers.56.mlp.experts.60.gate_proj", "model.layers.56.mlp.experts.61.gate_proj", "model.layers.56.mlp.experts.62.gate_proj", "model.layers.56.mlp.experts.63.gate_proj", "model.layers.56.mlp.experts.64.gate_proj", "model.layers.56.mlp.experts.65.gate_proj", "model.layers.56.mlp.experts.66.gate_proj", "model.layers.56.mlp.experts.67.gate_proj", "model.layers.56.mlp.experts.68.gate_proj", "model.layers.56.mlp.experts.69.gate_proj", "model.layers.56.mlp.experts.70.gate_proj", "model.layers.56.mlp.experts.71.gate_proj", "model.layers.56.mlp.experts.72.gate_proj", "model.layers.56.mlp.experts.73.gate_proj", "model.layers.56.mlp.experts.74.gate_proj", "model.layers.56.mlp.experts.75.gate_proj", "model.layers.56.mlp.experts.76.gate_proj", "model.layers.56.mlp.experts.77.gate_proj", "model.layers.56.mlp.experts.78.gate_proj", "model.layers.56.mlp.experts.79.gate_proj", "model.layers.56.mlp.experts.80.gate_proj", "model.layers.56.mlp.experts.81.gate_proj", "model.layers.56.mlp.experts.82.gate_proj", "model.layers.56.mlp.experts.83.gate_proj", "model.layers.56.mlp.experts.84.gate_proj", "model.layers.56.mlp.experts.85.gate_proj", "model.layers.56.mlp.experts.86.gate_proj", "model.layers.56.mlp.experts.87.gate_proj", "model.layers.56.mlp.experts.88.gate_proj", "model.layers.56.mlp.experts.89.gate_proj", "model.layers.56.mlp.experts.90.gate_proj", "model.layers.56.mlp.experts.91.gate_proj", "model.layers.56.mlp.experts.92.gate_proj", "model.layers.56.mlp.experts.93.gate_proj", "model.layers.56.mlp.experts.94.gate_proj", "model.layers.56.mlp.experts.95.gate_proj", "model.layers.56.mlp.experts.96.gate_proj", "model.layers.56.mlp.experts.97.gate_proj", "model.layers.56.mlp.experts.98.gate_proj", "model.layers.56.mlp.experts.99.gate_proj", "model.layers.56.mlp.experts.100.gate_proj", "model.layers.56.mlp.experts.101.gate_proj", "model.layers.56.mlp.experts.102.gate_proj", "model.layers.56.mlp.experts.103.gate_proj", "model.layers.56.mlp.experts.104.gate_proj", "model.layers.56.mlp.experts.105.gate_proj", "model.layers.56.mlp.experts.106.gate_proj", "model.layers.56.mlp.experts.107.gate_proj", "model.layers.56.mlp.experts.108.gate_proj", "model.layers.56.mlp.experts.109.gate_proj", "model.layers.56.mlp.experts.110.gate_proj", "model.layers.56.mlp.experts.111.gate_proj", "model.layers.56.mlp.experts.112.gate_proj", "model.layers.56.mlp.experts.113.gate_proj", "model.layers.56.mlp.experts.114.gate_proj", "model.layers.56.mlp.experts.115.gate_proj", "model.layers.56.mlp.experts.116.gate_proj", "model.layers.56.mlp.experts.117.gate_proj", "model.layers.56.mlp.experts.118.gate_proj", "model.layers.56.mlp.experts.119.gate_proj", "model.layers.56.mlp.experts.120.gate_proj", "model.layers.56.mlp.experts.121.gate_proj", "model.layers.56.mlp.experts.122.gate_proj", "model.layers.56.mlp.experts.123.gate_proj", "model.layers.56.mlp.experts.124.gate_proj", "model.layers.56.mlp.experts.125.gate_proj", "model.layers.56.mlp.experts.126.gate_proj", "model.layers.56.mlp.experts.127.gate_proj", "model.layers.56.mlp.experts.128.gate_proj", "model.layers.56.mlp.experts.129.gate_proj", "model.layers.56.mlp.experts.130.gate_proj", "model.layers.56.mlp.experts.131.gate_proj", "model.layers.56.mlp.experts.132.gate_proj", "model.layers.56.mlp.experts.133.gate_proj", "model.layers.56.mlp.experts.134.gate_proj", "model.layers.56.mlp.experts.135.gate_proj", "model.layers.56.mlp.experts.136.gate_proj", "model.layers.56.mlp.experts.137.gate_proj", "model.layers.56.mlp.experts.138.gate_proj", "model.layers.56.mlp.experts.139.gate_proj", "model.layers.56.mlp.experts.140.gate_proj", "model.layers.56.mlp.experts.141.gate_proj", "model.layers.56.mlp.experts.142.gate_proj", "model.layers.56.mlp.experts.143.gate_proj", "model.layers.56.mlp.experts.144.gate_proj", "model.layers.56.mlp.experts.145.gate_proj", "model.layers.56.mlp.experts.146.gate_proj", "model.layers.56.mlp.experts.147.gate_proj", "model.layers.56.mlp.experts.148.gate_proj", "model.layers.56.mlp.experts.149.gate_proj", "model.layers.56.mlp.experts.150.gate_proj", "model.layers.56.mlp.experts.151.gate_proj", "model.layers.56.mlp.experts.152.gate_proj", "model.layers.56.mlp.experts.153.gate_proj", "model.layers.56.mlp.experts.154.gate_proj", "model.layers.56.mlp.experts.155.gate_proj", "model.layers.56.mlp.experts.156.gate_proj", "model.layers.56.mlp.experts.157.gate_proj", "model.layers.56.mlp.experts.158.gate_proj", "model.layers.56.mlp.experts.159.gate_proj", "model.layers.56.mlp.experts.0.up_proj", "model.layers.56.mlp.experts.1.up_proj", "model.layers.56.mlp.experts.2.up_proj", "model.layers.56.mlp.experts.3.up_proj", "model.layers.56.mlp.experts.4.up_proj", "model.layers.56.mlp.experts.5.up_proj", "model.layers.56.mlp.experts.6.up_proj", "model.layers.56.mlp.experts.7.up_proj", "model.layers.56.mlp.experts.8.up_proj", "model.layers.56.mlp.experts.9.up_proj", "model.layers.56.mlp.experts.10.up_proj", "model.layers.56.mlp.experts.11.up_proj", "model.layers.56.mlp.experts.12.up_proj", "model.layers.56.mlp.experts.13.up_proj", "model.layers.56.mlp.experts.14.up_proj", "model.layers.56.mlp.experts.15.up_proj", "model.layers.56.mlp.experts.16.up_proj", "model.layers.56.mlp.experts.17.up_proj", "model.layers.56.mlp.experts.18.up_proj", "model.layers.56.mlp.experts.19.up_proj", "model.layers.56.mlp.experts.20.up_proj", "model.layers.56.mlp.experts.21.up_proj", "model.layers.56.mlp.experts.22.up_proj", "model.layers.56.mlp.experts.23.up_proj", "model.layers.56.mlp.experts.24.up_proj", "model.layers.56.mlp.experts.25.up_proj", "model.layers.56.mlp.experts.26.up_proj", "model.layers.56.mlp.experts.27.up_proj", "model.layers.56.mlp.experts.28.up_proj", "model.layers.56.mlp.experts.29.up_proj", "model.layers.56.mlp.experts.30.up_proj", "model.layers.56.mlp.experts.31.up_proj", "model.layers.56.mlp.experts.32.up_proj", "model.layers.56.mlp.experts.33.up_proj", "model.layers.56.mlp.experts.34.up_proj", "model.layers.56.mlp.experts.35.up_proj", "model.layers.56.mlp.experts.36.up_proj", "model.layers.56.mlp.experts.37.up_proj", "model.layers.56.mlp.experts.38.up_proj", "model.layers.56.mlp.experts.39.up_proj", "model.layers.56.mlp.experts.40.up_proj", "model.layers.56.mlp.experts.41.up_proj", "model.layers.56.mlp.experts.42.up_proj", "model.layers.56.mlp.experts.43.up_proj", "model.layers.56.mlp.experts.44.up_proj", "model.layers.56.mlp.experts.45.up_proj", "model.layers.56.mlp.experts.46.up_proj", "model.layers.56.mlp.experts.47.up_proj", "model.layers.56.mlp.experts.48.up_proj", "model.layers.56.mlp.experts.49.up_proj", "model.layers.56.mlp.experts.50.up_proj", "model.layers.56.mlp.experts.51.up_proj", "model.layers.56.mlp.experts.52.up_proj", "model.layers.56.mlp.experts.53.up_proj", "model.layers.56.mlp.experts.54.up_proj", "model.layers.56.mlp.experts.55.up_proj", "model.layers.56.mlp.experts.56.up_proj", "model.layers.56.mlp.experts.57.up_proj", "model.layers.56.mlp.experts.58.up_proj", "model.layers.56.mlp.experts.59.up_proj", "model.layers.56.mlp.experts.60.up_proj", "model.layers.56.mlp.experts.61.up_proj", "model.layers.56.mlp.experts.62.up_proj", "model.layers.56.mlp.experts.63.up_proj", "model.layers.56.mlp.experts.64.up_proj", "model.layers.56.mlp.experts.65.up_proj", "model.layers.56.mlp.experts.66.up_proj", "model.layers.56.mlp.experts.67.up_proj", "model.layers.56.mlp.experts.68.up_proj", "model.layers.56.mlp.experts.69.up_proj", "model.layers.56.mlp.experts.70.up_proj", "model.layers.56.mlp.experts.71.up_proj", "model.layers.56.mlp.experts.72.up_proj", "model.layers.56.mlp.experts.73.up_proj", "model.layers.56.mlp.experts.74.up_proj", "model.layers.56.mlp.experts.75.up_proj", "model.layers.56.mlp.experts.76.up_proj", "model.layers.56.mlp.experts.77.up_proj", "model.layers.56.mlp.experts.78.up_proj", "model.layers.56.mlp.experts.79.up_proj", "model.layers.56.mlp.experts.80.up_proj", "model.layers.56.mlp.experts.81.up_proj", "model.layers.56.mlp.experts.82.up_proj", "model.layers.56.mlp.experts.83.up_proj", "model.layers.56.mlp.experts.84.up_proj", "model.layers.56.mlp.experts.85.up_proj", "model.layers.56.mlp.experts.86.up_proj", "model.layers.56.mlp.experts.87.up_proj", "model.layers.56.mlp.experts.88.up_proj", "model.layers.56.mlp.experts.89.up_proj", "model.layers.56.mlp.experts.90.up_proj", "model.layers.56.mlp.experts.91.up_proj", "model.layers.56.mlp.experts.92.up_proj", "model.layers.56.mlp.experts.93.up_proj", "model.layers.56.mlp.experts.94.up_proj", "model.layers.56.mlp.experts.95.up_proj", "model.layers.56.mlp.experts.96.up_proj", "model.layers.56.mlp.experts.97.up_proj", "model.layers.56.mlp.experts.98.up_proj", "model.layers.56.mlp.experts.99.up_proj", "model.layers.56.mlp.experts.100.up_proj", "model.layers.56.mlp.experts.101.up_proj", "model.layers.56.mlp.experts.102.up_proj", "model.layers.56.mlp.experts.103.up_proj", "model.layers.56.mlp.experts.104.up_proj", "model.layers.56.mlp.experts.105.up_proj", "model.layers.56.mlp.experts.106.up_proj", "model.layers.56.mlp.experts.107.up_proj", "model.layers.56.mlp.experts.108.up_proj", "model.layers.56.mlp.experts.109.up_proj", "model.layers.56.mlp.experts.110.up_proj", "model.layers.56.mlp.experts.111.up_proj", "model.layers.56.mlp.experts.112.up_proj", "model.layers.56.mlp.experts.113.up_proj", "model.layers.56.mlp.experts.114.up_proj", "model.layers.56.mlp.experts.115.up_proj", "model.layers.56.mlp.experts.116.up_proj", "model.layers.56.mlp.experts.117.up_proj", "model.layers.56.mlp.experts.118.up_proj", "model.layers.56.mlp.experts.119.up_proj", "model.layers.56.mlp.experts.120.up_proj", "model.layers.56.mlp.experts.121.up_proj", "model.layers.56.mlp.experts.122.up_proj", "model.layers.56.mlp.experts.123.up_proj", "model.layers.56.mlp.experts.124.up_proj", "model.layers.56.mlp.experts.125.up_proj", "model.layers.56.mlp.experts.126.up_proj", "model.layers.56.mlp.experts.127.up_proj", "model.layers.56.mlp.experts.128.up_proj", "model.layers.56.mlp.experts.129.up_proj", "model.layers.56.mlp.experts.130.up_proj", "model.layers.56.mlp.experts.131.up_proj", "model.layers.56.mlp.experts.132.up_proj", "model.layers.56.mlp.experts.133.up_proj", "model.layers.56.mlp.experts.134.up_proj", "model.layers.56.mlp.experts.135.up_proj", "model.layers.56.mlp.experts.136.up_proj", "model.layers.56.mlp.experts.137.up_proj", "model.layers.56.mlp.experts.138.up_proj", "model.layers.56.mlp.experts.139.up_proj", "model.layers.56.mlp.experts.140.up_proj", "model.layers.56.mlp.experts.141.up_proj", "model.layers.56.mlp.experts.142.up_proj", "model.layers.56.mlp.experts.143.up_proj", "model.layers.56.mlp.experts.144.up_proj", "model.layers.56.mlp.experts.145.up_proj", "model.layers.56.mlp.experts.146.up_proj", "model.layers.56.mlp.experts.147.up_proj", "model.layers.56.mlp.experts.148.up_proj", "model.layers.56.mlp.experts.149.up_proj", "model.layers.56.mlp.experts.150.up_proj", "model.layers.56.mlp.experts.151.up_proj", "model.layers.56.mlp.experts.152.up_proj", "model.layers.56.mlp.experts.153.up_proj", "model.layers.56.mlp.experts.154.up_proj", "model.layers.56.mlp.experts.155.up_proj", "model.layers.56.mlp.experts.156.up_proj", "model.layers.56.mlp.experts.157.up_proj", "model.layers.56.mlp.experts.158.up_proj", "model.layers.56.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.576214563101669e-05, "dbits": 2516582400 }, { "dkld": -1.0192859917872166e-06, "dbits": 5033164800 } ] }, { "idx": 338, "layers": [ "model.layers.56.mlp.experts.0.down_proj", "model.layers.56.mlp.experts.1.down_proj", "model.layers.56.mlp.experts.2.down_proj", "model.layers.56.mlp.experts.3.down_proj", "model.layers.56.mlp.experts.4.down_proj", "model.layers.56.mlp.experts.5.down_proj", "model.layers.56.mlp.experts.6.down_proj", "model.layers.56.mlp.experts.7.down_proj", "model.layers.56.mlp.experts.8.down_proj", "model.layers.56.mlp.experts.9.down_proj", "model.layers.56.mlp.experts.10.down_proj", "model.layers.56.mlp.experts.11.down_proj", "model.layers.56.mlp.experts.12.down_proj", "model.layers.56.mlp.experts.13.down_proj", "model.layers.56.mlp.experts.14.down_proj", "model.layers.56.mlp.experts.15.down_proj", "model.layers.56.mlp.experts.16.down_proj", "model.layers.56.mlp.experts.17.down_proj", "model.layers.56.mlp.experts.18.down_proj", "model.layers.56.mlp.experts.19.down_proj", "model.layers.56.mlp.experts.20.down_proj", "model.layers.56.mlp.experts.21.down_proj", "model.layers.56.mlp.experts.22.down_proj", "model.layers.56.mlp.experts.23.down_proj", "model.layers.56.mlp.experts.24.down_proj", "model.layers.56.mlp.experts.25.down_proj", "model.layers.56.mlp.experts.26.down_proj", "model.layers.56.mlp.experts.27.down_proj", "model.layers.56.mlp.experts.28.down_proj", "model.layers.56.mlp.experts.29.down_proj", "model.layers.56.mlp.experts.30.down_proj", "model.layers.56.mlp.experts.31.down_proj", "model.layers.56.mlp.experts.32.down_proj", "model.layers.56.mlp.experts.33.down_proj", "model.layers.56.mlp.experts.34.down_proj", "model.layers.56.mlp.experts.35.down_proj", "model.layers.56.mlp.experts.36.down_proj", "model.layers.56.mlp.experts.37.down_proj", "model.layers.56.mlp.experts.38.down_proj", "model.layers.56.mlp.experts.39.down_proj", "model.layers.56.mlp.experts.40.down_proj", "model.layers.56.mlp.experts.41.down_proj", "model.layers.56.mlp.experts.42.down_proj", "model.layers.56.mlp.experts.43.down_proj", "model.layers.56.mlp.experts.44.down_proj", "model.layers.56.mlp.experts.45.down_proj", "model.layers.56.mlp.experts.46.down_proj", "model.layers.56.mlp.experts.47.down_proj", "model.layers.56.mlp.experts.48.down_proj", "model.layers.56.mlp.experts.49.down_proj", "model.layers.56.mlp.experts.50.down_proj", "model.layers.56.mlp.experts.51.down_proj", "model.layers.56.mlp.experts.52.down_proj", "model.layers.56.mlp.experts.53.down_proj", "model.layers.56.mlp.experts.54.down_proj", "model.layers.56.mlp.experts.55.down_proj", "model.layers.56.mlp.experts.56.down_proj", "model.layers.56.mlp.experts.57.down_proj", "model.layers.56.mlp.experts.58.down_proj", "model.layers.56.mlp.experts.59.down_proj", "model.layers.56.mlp.experts.60.down_proj", "model.layers.56.mlp.experts.61.down_proj", "model.layers.56.mlp.experts.62.down_proj", "model.layers.56.mlp.experts.63.down_proj", "model.layers.56.mlp.experts.64.down_proj", "model.layers.56.mlp.experts.65.down_proj", "model.layers.56.mlp.experts.66.down_proj", "model.layers.56.mlp.experts.67.down_proj", "model.layers.56.mlp.experts.68.down_proj", "model.layers.56.mlp.experts.69.down_proj", "model.layers.56.mlp.experts.70.down_proj", "model.layers.56.mlp.experts.71.down_proj", "model.layers.56.mlp.experts.72.down_proj", "model.layers.56.mlp.experts.73.down_proj", "model.layers.56.mlp.experts.74.down_proj", "model.layers.56.mlp.experts.75.down_proj", "model.layers.56.mlp.experts.76.down_proj", "model.layers.56.mlp.experts.77.down_proj", "model.layers.56.mlp.experts.78.down_proj", "model.layers.56.mlp.experts.79.down_proj", "model.layers.56.mlp.experts.80.down_proj", "model.layers.56.mlp.experts.81.down_proj", "model.layers.56.mlp.experts.82.down_proj", "model.layers.56.mlp.experts.83.down_proj", "model.layers.56.mlp.experts.84.down_proj", "model.layers.56.mlp.experts.85.down_proj", "model.layers.56.mlp.experts.86.down_proj", "model.layers.56.mlp.experts.87.down_proj", "model.layers.56.mlp.experts.88.down_proj", "model.layers.56.mlp.experts.89.down_proj", "model.layers.56.mlp.experts.90.down_proj", "model.layers.56.mlp.experts.91.down_proj", "model.layers.56.mlp.experts.92.down_proj", "model.layers.56.mlp.experts.93.down_proj", "model.layers.56.mlp.experts.94.down_proj", "model.layers.56.mlp.experts.95.down_proj", "model.layers.56.mlp.experts.96.down_proj", "model.layers.56.mlp.experts.97.down_proj", "model.layers.56.mlp.experts.98.down_proj", "model.layers.56.mlp.experts.99.down_proj", "model.layers.56.mlp.experts.100.down_proj", "model.layers.56.mlp.experts.101.down_proj", "model.layers.56.mlp.experts.102.down_proj", "model.layers.56.mlp.experts.103.down_proj", "model.layers.56.mlp.experts.104.down_proj", "model.layers.56.mlp.experts.105.down_proj", "model.layers.56.mlp.experts.106.down_proj", "model.layers.56.mlp.experts.107.down_proj", "model.layers.56.mlp.experts.108.down_proj", "model.layers.56.mlp.experts.109.down_proj", "model.layers.56.mlp.experts.110.down_proj", "model.layers.56.mlp.experts.111.down_proj", "model.layers.56.mlp.experts.112.down_proj", "model.layers.56.mlp.experts.113.down_proj", "model.layers.56.mlp.experts.114.down_proj", "model.layers.56.mlp.experts.115.down_proj", "model.layers.56.mlp.experts.116.down_proj", "model.layers.56.mlp.experts.117.down_proj", "model.layers.56.mlp.experts.118.down_proj", "model.layers.56.mlp.experts.119.down_proj", "model.layers.56.mlp.experts.120.down_proj", "model.layers.56.mlp.experts.121.down_proj", "model.layers.56.mlp.experts.122.down_proj", "model.layers.56.mlp.experts.123.down_proj", "model.layers.56.mlp.experts.124.down_proj", "model.layers.56.mlp.experts.125.down_proj", "model.layers.56.mlp.experts.126.down_proj", "model.layers.56.mlp.experts.127.down_proj", "model.layers.56.mlp.experts.128.down_proj", "model.layers.56.mlp.experts.129.down_proj", "model.layers.56.mlp.experts.130.down_proj", "model.layers.56.mlp.experts.131.down_proj", "model.layers.56.mlp.experts.132.down_proj", "model.layers.56.mlp.experts.133.down_proj", "model.layers.56.mlp.experts.134.down_proj", "model.layers.56.mlp.experts.135.down_proj", "model.layers.56.mlp.experts.136.down_proj", "model.layers.56.mlp.experts.137.down_proj", "model.layers.56.mlp.experts.138.down_proj", "model.layers.56.mlp.experts.139.down_proj", "model.layers.56.mlp.experts.140.down_proj", "model.layers.56.mlp.experts.141.down_proj", "model.layers.56.mlp.experts.142.down_proj", "model.layers.56.mlp.experts.143.down_proj", "model.layers.56.mlp.experts.144.down_proj", "model.layers.56.mlp.experts.145.down_proj", "model.layers.56.mlp.experts.146.down_proj", "model.layers.56.mlp.experts.147.down_proj", "model.layers.56.mlp.experts.148.down_proj", "model.layers.56.mlp.experts.149.down_proj", "model.layers.56.mlp.experts.150.down_proj", "model.layers.56.mlp.experts.151.down_proj", "model.layers.56.mlp.experts.152.down_proj", "model.layers.56.mlp.experts.153.down_proj", "model.layers.56.mlp.experts.154.down_proj", "model.layers.56.mlp.experts.155.down_proj", "model.layers.56.mlp.experts.156.down_proj", "model.layers.56.mlp.experts.157.down_proj", "model.layers.56.mlp.experts.158.down_proj", "model.layers.56.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 4.547997377812862e-06, "dbits": 1258291200 }, { "dkld": 4.084734246135799e-06, "dbits": 2516582400 } ] }, { "idx": 339, "layers": [ "model.layers.57.self_attn.q_proj" ], "candidates": [ { "dkld": 1.5081488527357578e-05, "dbits": 62914560 }, { "dkld": 9.937351569533695e-06, "dbits": 125829120 } ] }, { "idx": 340, "layers": [ "model.layers.57.self_attn.k_proj", "model.layers.57.self_attn.v_proj" ], "candidates": [ { "dkld": -1.0978011414407643e-05, "dbits": 10485760 }, { "dkld": -9.66899096965096e-07, "dbits": 20971520 } ] }, { "idx": 341, "layers": [ "model.layers.57.self_attn.o_proj" ], "candidates": [ { "dkld": 3.882544115187125e-06, "dbits": 62914560 }, { "dkld": -7.055723108349843e-06, "dbits": 125829120 } ] }, { "idx": 342, "layers": [ "model.layers.57.mlp.shared_experts.gate_proj", "model.layers.57.mlp.shared_experts.up_proj", "model.layers.57.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.5323678962887027e-05, "dbits": 23592960 }, { "dkld": 1.0285456664860942e-05, "dbits": 47185920 } ] }, { "idx": 343, "layers": [ "model.layers.57.mlp.experts.0.gate_proj", "model.layers.57.mlp.experts.1.gate_proj", "model.layers.57.mlp.experts.2.gate_proj", "model.layers.57.mlp.experts.3.gate_proj", "model.layers.57.mlp.experts.4.gate_proj", "model.layers.57.mlp.experts.5.gate_proj", "model.layers.57.mlp.experts.6.gate_proj", "model.layers.57.mlp.experts.7.gate_proj", "model.layers.57.mlp.experts.8.gate_proj", "model.layers.57.mlp.experts.9.gate_proj", "model.layers.57.mlp.experts.10.gate_proj", "model.layers.57.mlp.experts.11.gate_proj", "model.layers.57.mlp.experts.12.gate_proj", "model.layers.57.mlp.experts.13.gate_proj", "model.layers.57.mlp.experts.14.gate_proj", "model.layers.57.mlp.experts.15.gate_proj", "model.layers.57.mlp.experts.16.gate_proj", "model.layers.57.mlp.experts.17.gate_proj", "model.layers.57.mlp.experts.18.gate_proj", "model.layers.57.mlp.experts.19.gate_proj", "model.layers.57.mlp.experts.20.gate_proj", "model.layers.57.mlp.experts.21.gate_proj", "model.layers.57.mlp.experts.22.gate_proj", "model.layers.57.mlp.experts.23.gate_proj", "model.layers.57.mlp.experts.24.gate_proj", "model.layers.57.mlp.experts.25.gate_proj", "model.layers.57.mlp.experts.26.gate_proj", "model.layers.57.mlp.experts.27.gate_proj", "model.layers.57.mlp.experts.28.gate_proj", "model.layers.57.mlp.experts.29.gate_proj", "model.layers.57.mlp.experts.30.gate_proj", "model.layers.57.mlp.experts.31.gate_proj", "model.layers.57.mlp.experts.32.gate_proj", "model.layers.57.mlp.experts.33.gate_proj", "model.layers.57.mlp.experts.34.gate_proj", "model.layers.57.mlp.experts.35.gate_proj", "model.layers.57.mlp.experts.36.gate_proj", "model.layers.57.mlp.experts.37.gate_proj", "model.layers.57.mlp.experts.38.gate_proj", "model.layers.57.mlp.experts.39.gate_proj", "model.layers.57.mlp.experts.40.gate_proj", "model.layers.57.mlp.experts.41.gate_proj", "model.layers.57.mlp.experts.42.gate_proj", "model.layers.57.mlp.experts.43.gate_proj", "model.layers.57.mlp.experts.44.gate_proj", "model.layers.57.mlp.experts.45.gate_proj", "model.layers.57.mlp.experts.46.gate_proj", "model.layers.57.mlp.experts.47.gate_proj", "model.layers.57.mlp.experts.48.gate_proj", "model.layers.57.mlp.experts.49.gate_proj", "model.layers.57.mlp.experts.50.gate_proj", "model.layers.57.mlp.experts.51.gate_proj", "model.layers.57.mlp.experts.52.gate_proj", "model.layers.57.mlp.experts.53.gate_proj", "model.layers.57.mlp.experts.54.gate_proj", "model.layers.57.mlp.experts.55.gate_proj", "model.layers.57.mlp.experts.56.gate_proj", "model.layers.57.mlp.experts.57.gate_proj", "model.layers.57.mlp.experts.58.gate_proj", "model.layers.57.mlp.experts.59.gate_proj", "model.layers.57.mlp.experts.60.gate_proj", "model.layers.57.mlp.experts.61.gate_proj", "model.layers.57.mlp.experts.62.gate_proj", "model.layers.57.mlp.experts.63.gate_proj", "model.layers.57.mlp.experts.64.gate_proj", "model.layers.57.mlp.experts.65.gate_proj", "model.layers.57.mlp.experts.66.gate_proj", "model.layers.57.mlp.experts.67.gate_proj", "model.layers.57.mlp.experts.68.gate_proj", "model.layers.57.mlp.experts.69.gate_proj", "model.layers.57.mlp.experts.70.gate_proj", "model.layers.57.mlp.experts.71.gate_proj", "model.layers.57.mlp.experts.72.gate_proj", "model.layers.57.mlp.experts.73.gate_proj", "model.layers.57.mlp.experts.74.gate_proj", "model.layers.57.mlp.experts.75.gate_proj", "model.layers.57.mlp.experts.76.gate_proj", "model.layers.57.mlp.experts.77.gate_proj", "model.layers.57.mlp.experts.78.gate_proj", "model.layers.57.mlp.experts.79.gate_proj", "model.layers.57.mlp.experts.80.gate_proj", "model.layers.57.mlp.experts.81.gate_proj", "model.layers.57.mlp.experts.82.gate_proj", "model.layers.57.mlp.experts.83.gate_proj", "model.layers.57.mlp.experts.84.gate_proj", "model.layers.57.mlp.experts.85.gate_proj", "model.layers.57.mlp.experts.86.gate_proj", "model.layers.57.mlp.experts.87.gate_proj", "model.layers.57.mlp.experts.88.gate_proj", "model.layers.57.mlp.experts.89.gate_proj", "model.layers.57.mlp.experts.90.gate_proj", "model.layers.57.mlp.experts.91.gate_proj", "model.layers.57.mlp.experts.92.gate_proj", "model.layers.57.mlp.experts.93.gate_proj", "model.layers.57.mlp.experts.94.gate_proj", "model.layers.57.mlp.experts.95.gate_proj", "model.layers.57.mlp.experts.96.gate_proj", "model.layers.57.mlp.experts.97.gate_proj", "model.layers.57.mlp.experts.98.gate_proj", "model.layers.57.mlp.experts.99.gate_proj", "model.layers.57.mlp.experts.100.gate_proj", "model.layers.57.mlp.experts.101.gate_proj", "model.layers.57.mlp.experts.102.gate_proj", "model.layers.57.mlp.experts.103.gate_proj", "model.layers.57.mlp.experts.104.gate_proj", "model.layers.57.mlp.experts.105.gate_proj", "model.layers.57.mlp.experts.106.gate_proj", "model.layers.57.mlp.experts.107.gate_proj", "model.layers.57.mlp.experts.108.gate_proj", "model.layers.57.mlp.experts.109.gate_proj", "model.layers.57.mlp.experts.110.gate_proj", "model.layers.57.mlp.experts.111.gate_proj", "model.layers.57.mlp.experts.112.gate_proj", "model.layers.57.mlp.experts.113.gate_proj", "model.layers.57.mlp.experts.114.gate_proj", "model.layers.57.mlp.experts.115.gate_proj", "model.layers.57.mlp.experts.116.gate_proj", "model.layers.57.mlp.experts.117.gate_proj", "model.layers.57.mlp.experts.118.gate_proj", "model.layers.57.mlp.experts.119.gate_proj", "model.layers.57.mlp.experts.120.gate_proj", "model.layers.57.mlp.experts.121.gate_proj", "model.layers.57.mlp.experts.122.gate_proj", "model.layers.57.mlp.experts.123.gate_proj", "model.layers.57.mlp.experts.124.gate_proj", "model.layers.57.mlp.experts.125.gate_proj", "model.layers.57.mlp.experts.126.gate_proj", "model.layers.57.mlp.experts.127.gate_proj", "model.layers.57.mlp.experts.128.gate_proj", "model.layers.57.mlp.experts.129.gate_proj", "model.layers.57.mlp.experts.130.gate_proj", "model.layers.57.mlp.experts.131.gate_proj", "model.layers.57.mlp.experts.132.gate_proj", "model.layers.57.mlp.experts.133.gate_proj", "model.layers.57.mlp.experts.134.gate_proj", "model.layers.57.mlp.experts.135.gate_proj", "model.layers.57.mlp.experts.136.gate_proj", "model.layers.57.mlp.experts.137.gate_proj", "model.layers.57.mlp.experts.138.gate_proj", "model.layers.57.mlp.experts.139.gate_proj", "model.layers.57.mlp.experts.140.gate_proj", "model.layers.57.mlp.experts.141.gate_proj", "model.layers.57.mlp.experts.142.gate_proj", "model.layers.57.mlp.experts.143.gate_proj", "model.layers.57.mlp.experts.144.gate_proj", "model.layers.57.mlp.experts.145.gate_proj", "model.layers.57.mlp.experts.146.gate_proj", "model.layers.57.mlp.experts.147.gate_proj", "model.layers.57.mlp.experts.148.gate_proj", "model.layers.57.mlp.experts.149.gate_proj", "model.layers.57.mlp.experts.150.gate_proj", "model.layers.57.mlp.experts.151.gate_proj", "model.layers.57.mlp.experts.152.gate_proj", "model.layers.57.mlp.experts.153.gate_proj", "model.layers.57.mlp.experts.154.gate_proj", "model.layers.57.mlp.experts.155.gate_proj", "model.layers.57.mlp.experts.156.gate_proj", "model.layers.57.mlp.experts.157.gate_proj", "model.layers.57.mlp.experts.158.gate_proj", "model.layers.57.mlp.experts.159.gate_proj", "model.layers.57.mlp.experts.0.up_proj", "model.layers.57.mlp.experts.1.up_proj", "model.layers.57.mlp.experts.2.up_proj", "model.layers.57.mlp.experts.3.up_proj", "model.layers.57.mlp.experts.4.up_proj", "model.layers.57.mlp.experts.5.up_proj", "model.layers.57.mlp.experts.6.up_proj", "model.layers.57.mlp.experts.7.up_proj", "model.layers.57.mlp.experts.8.up_proj", "model.layers.57.mlp.experts.9.up_proj", "model.layers.57.mlp.experts.10.up_proj", "model.layers.57.mlp.experts.11.up_proj", "model.layers.57.mlp.experts.12.up_proj", "model.layers.57.mlp.experts.13.up_proj", "model.layers.57.mlp.experts.14.up_proj", "model.layers.57.mlp.experts.15.up_proj", "model.layers.57.mlp.experts.16.up_proj", "model.layers.57.mlp.experts.17.up_proj", "model.layers.57.mlp.experts.18.up_proj", "model.layers.57.mlp.experts.19.up_proj", "model.layers.57.mlp.experts.20.up_proj", "model.layers.57.mlp.experts.21.up_proj", "model.layers.57.mlp.experts.22.up_proj", "model.layers.57.mlp.experts.23.up_proj", "model.layers.57.mlp.experts.24.up_proj", "model.layers.57.mlp.experts.25.up_proj", "model.layers.57.mlp.experts.26.up_proj", "model.layers.57.mlp.experts.27.up_proj", "model.layers.57.mlp.experts.28.up_proj", "model.layers.57.mlp.experts.29.up_proj", "model.layers.57.mlp.experts.30.up_proj", "model.layers.57.mlp.experts.31.up_proj", "model.layers.57.mlp.experts.32.up_proj", "model.layers.57.mlp.experts.33.up_proj", "model.layers.57.mlp.experts.34.up_proj", "model.layers.57.mlp.experts.35.up_proj", "model.layers.57.mlp.experts.36.up_proj", "model.layers.57.mlp.experts.37.up_proj", "model.layers.57.mlp.experts.38.up_proj", "model.layers.57.mlp.experts.39.up_proj", "model.layers.57.mlp.experts.40.up_proj", "model.layers.57.mlp.experts.41.up_proj", "model.layers.57.mlp.experts.42.up_proj", "model.layers.57.mlp.experts.43.up_proj", "model.layers.57.mlp.experts.44.up_proj", "model.layers.57.mlp.experts.45.up_proj", "model.layers.57.mlp.experts.46.up_proj", "model.layers.57.mlp.experts.47.up_proj", "model.layers.57.mlp.experts.48.up_proj", "model.layers.57.mlp.experts.49.up_proj", "model.layers.57.mlp.experts.50.up_proj", "model.layers.57.mlp.experts.51.up_proj", "model.layers.57.mlp.experts.52.up_proj", "model.layers.57.mlp.experts.53.up_proj", "model.layers.57.mlp.experts.54.up_proj", "model.layers.57.mlp.experts.55.up_proj", "model.layers.57.mlp.experts.56.up_proj", "model.layers.57.mlp.experts.57.up_proj", "model.layers.57.mlp.experts.58.up_proj", "model.layers.57.mlp.experts.59.up_proj", "model.layers.57.mlp.experts.60.up_proj", "model.layers.57.mlp.experts.61.up_proj", "model.layers.57.mlp.experts.62.up_proj", "model.layers.57.mlp.experts.63.up_proj", "model.layers.57.mlp.experts.64.up_proj", "model.layers.57.mlp.experts.65.up_proj", "model.layers.57.mlp.experts.66.up_proj", "model.layers.57.mlp.experts.67.up_proj", "model.layers.57.mlp.experts.68.up_proj", "model.layers.57.mlp.experts.69.up_proj", "model.layers.57.mlp.experts.70.up_proj", "model.layers.57.mlp.experts.71.up_proj", "model.layers.57.mlp.experts.72.up_proj", "model.layers.57.mlp.experts.73.up_proj", "model.layers.57.mlp.experts.74.up_proj", "model.layers.57.mlp.experts.75.up_proj", "model.layers.57.mlp.experts.76.up_proj", "model.layers.57.mlp.experts.77.up_proj", "model.layers.57.mlp.experts.78.up_proj", "model.layers.57.mlp.experts.79.up_proj", "model.layers.57.mlp.experts.80.up_proj", "model.layers.57.mlp.experts.81.up_proj", "model.layers.57.mlp.experts.82.up_proj", "model.layers.57.mlp.experts.83.up_proj", "model.layers.57.mlp.experts.84.up_proj", "model.layers.57.mlp.experts.85.up_proj", "model.layers.57.mlp.experts.86.up_proj", "model.layers.57.mlp.experts.87.up_proj", "model.layers.57.mlp.experts.88.up_proj", "model.layers.57.mlp.experts.89.up_proj", "model.layers.57.mlp.experts.90.up_proj", "model.layers.57.mlp.experts.91.up_proj", "model.layers.57.mlp.experts.92.up_proj", "model.layers.57.mlp.experts.93.up_proj", "model.layers.57.mlp.experts.94.up_proj", "model.layers.57.mlp.experts.95.up_proj", "model.layers.57.mlp.experts.96.up_proj", "model.layers.57.mlp.experts.97.up_proj", "model.layers.57.mlp.experts.98.up_proj", "model.layers.57.mlp.experts.99.up_proj", "model.layers.57.mlp.experts.100.up_proj", "model.layers.57.mlp.experts.101.up_proj", "model.layers.57.mlp.experts.102.up_proj", "model.layers.57.mlp.experts.103.up_proj", "model.layers.57.mlp.experts.104.up_proj", "model.layers.57.mlp.experts.105.up_proj", "model.layers.57.mlp.experts.106.up_proj", "model.layers.57.mlp.experts.107.up_proj", "model.layers.57.mlp.experts.108.up_proj", "model.layers.57.mlp.experts.109.up_proj", "model.layers.57.mlp.experts.110.up_proj", "model.layers.57.mlp.experts.111.up_proj", "model.layers.57.mlp.experts.112.up_proj", "model.layers.57.mlp.experts.113.up_proj", "model.layers.57.mlp.experts.114.up_proj", "model.layers.57.mlp.experts.115.up_proj", "model.layers.57.mlp.experts.116.up_proj", "model.layers.57.mlp.experts.117.up_proj", "model.layers.57.mlp.experts.118.up_proj", "model.layers.57.mlp.experts.119.up_proj", "model.layers.57.mlp.experts.120.up_proj", "model.layers.57.mlp.experts.121.up_proj", "model.layers.57.mlp.experts.122.up_proj", "model.layers.57.mlp.experts.123.up_proj", "model.layers.57.mlp.experts.124.up_proj", "model.layers.57.mlp.experts.125.up_proj", "model.layers.57.mlp.experts.126.up_proj", "model.layers.57.mlp.experts.127.up_proj", "model.layers.57.mlp.experts.128.up_proj", "model.layers.57.mlp.experts.129.up_proj", "model.layers.57.mlp.experts.130.up_proj", "model.layers.57.mlp.experts.131.up_proj", "model.layers.57.mlp.experts.132.up_proj", "model.layers.57.mlp.experts.133.up_proj", "model.layers.57.mlp.experts.134.up_proj", "model.layers.57.mlp.experts.135.up_proj", "model.layers.57.mlp.experts.136.up_proj", "model.layers.57.mlp.experts.137.up_proj", "model.layers.57.mlp.experts.138.up_proj", "model.layers.57.mlp.experts.139.up_proj", "model.layers.57.mlp.experts.140.up_proj", "model.layers.57.mlp.experts.141.up_proj", "model.layers.57.mlp.experts.142.up_proj", "model.layers.57.mlp.experts.143.up_proj", "model.layers.57.mlp.experts.144.up_proj", "model.layers.57.mlp.experts.145.up_proj", "model.layers.57.mlp.experts.146.up_proj", "model.layers.57.mlp.experts.147.up_proj", "model.layers.57.mlp.experts.148.up_proj", "model.layers.57.mlp.experts.149.up_proj", "model.layers.57.mlp.experts.150.up_proj", "model.layers.57.mlp.experts.151.up_proj", "model.layers.57.mlp.experts.152.up_proj", "model.layers.57.mlp.experts.153.up_proj", "model.layers.57.mlp.experts.154.up_proj", "model.layers.57.mlp.experts.155.up_proj", "model.layers.57.mlp.experts.156.up_proj", "model.layers.57.mlp.experts.157.up_proj", "model.layers.57.mlp.experts.158.up_proj", "model.layers.57.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.176886726170917e-05, "dbits": 2516582400 }, { "dkld": 3.0976487323652185e-06, "dbits": 5033164800 } ] }, { "idx": 344, "layers": [ "model.layers.57.mlp.experts.0.down_proj", "model.layers.57.mlp.experts.1.down_proj", "model.layers.57.mlp.experts.2.down_proj", "model.layers.57.mlp.experts.3.down_proj", "model.layers.57.mlp.experts.4.down_proj", "model.layers.57.mlp.experts.5.down_proj", "model.layers.57.mlp.experts.6.down_proj", "model.layers.57.mlp.experts.7.down_proj", "model.layers.57.mlp.experts.8.down_proj", "model.layers.57.mlp.experts.9.down_proj", "model.layers.57.mlp.experts.10.down_proj", "model.layers.57.mlp.experts.11.down_proj", "model.layers.57.mlp.experts.12.down_proj", "model.layers.57.mlp.experts.13.down_proj", "model.layers.57.mlp.experts.14.down_proj", "model.layers.57.mlp.experts.15.down_proj", "model.layers.57.mlp.experts.16.down_proj", "model.layers.57.mlp.experts.17.down_proj", "model.layers.57.mlp.experts.18.down_proj", "model.layers.57.mlp.experts.19.down_proj", "model.layers.57.mlp.experts.20.down_proj", "model.layers.57.mlp.experts.21.down_proj", "model.layers.57.mlp.experts.22.down_proj", "model.layers.57.mlp.experts.23.down_proj", "model.layers.57.mlp.experts.24.down_proj", "model.layers.57.mlp.experts.25.down_proj", "model.layers.57.mlp.experts.26.down_proj", "model.layers.57.mlp.experts.27.down_proj", "model.layers.57.mlp.experts.28.down_proj", "model.layers.57.mlp.experts.29.down_proj", "model.layers.57.mlp.experts.30.down_proj", "model.layers.57.mlp.experts.31.down_proj", "model.layers.57.mlp.experts.32.down_proj", "model.layers.57.mlp.experts.33.down_proj", "model.layers.57.mlp.experts.34.down_proj", "model.layers.57.mlp.experts.35.down_proj", "model.layers.57.mlp.experts.36.down_proj", "model.layers.57.mlp.experts.37.down_proj", "model.layers.57.mlp.experts.38.down_proj", "model.layers.57.mlp.experts.39.down_proj", "model.layers.57.mlp.experts.40.down_proj", "model.layers.57.mlp.experts.41.down_proj", "model.layers.57.mlp.experts.42.down_proj", "model.layers.57.mlp.experts.43.down_proj", "model.layers.57.mlp.experts.44.down_proj", "model.layers.57.mlp.experts.45.down_proj", "model.layers.57.mlp.experts.46.down_proj", "model.layers.57.mlp.experts.47.down_proj", "model.layers.57.mlp.experts.48.down_proj", "model.layers.57.mlp.experts.49.down_proj", "model.layers.57.mlp.experts.50.down_proj", "model.layers.57.mlp.experts.51.down_proj", "model.layers.57.mlp.experts.52.down_proj", "model.layers.57.mlp.experts.53.down_proj", "model.layers.57.mlp.experts.54.down_proj", "model.layers.57.mlp.experts.55.down_proj", "model.layers.57.mlp.experts.56.down_proj", "model.layers.57.mlp.experts.57.down_proj", "model.layers.57.mlp.experts.58.down_proj", "model.layers.57.mlp.experts.59.down_proj", "model.layers.57.mlp.experts.60.down_proj", "model.layers.57.mlp.experts.61.down_proj", "model.layers.57.mlp.experts.62.down_proj", "model.layers.57.mlp.experts.63.down_proj", "model.layers.57.mlp.experts.64.down_proj", "model.layers.57.mlp.experts.65.down_proj", "model.layers.57.mlp.experts.66.down_proj", "model.layers.57.mlp.experts.67.down_proj", "model.layers.57.mlp.experts.68.down_proj", "model.layers.57.mlp.experts.69.down_proj", "model.layers.57.mlp.experts.70.down_proj", "model.layers.57.mlp.experts.71.down_proj", "model.layers.57.mlp.experts.72.down_proj", "model.layers.57.mlp.experts.73.down_proj", "model.layers.57.mlp.experts.74.down_proj", "model.layers.57.mlp.experts.75.down_proj", "model.layers.57.mlp.experts.76.down_proj", "model.layers.57.mlp.experts.77.down_proj", "model.layers.57.mlp.experts.78.down_proj", "model.layers.57.mlp.experts.79.down_proj", "model.layers.57.mlp.experts.80.down_proj", "model.layers.57.mlp.experts.81.down_proj", "model.layers.57.mlp.experts.82.down_proj", "model.layers.57.mlp.experts.83.down_proj", "model.layers.57.mlp.experts.84.down_proj", "model.layers.57.mlp.experts.85.down_proj", "model.layers.57.mlp.experts.86.down_proj", "model.layers.57.mlp.experts.87.down_proj", "model.layers.57.mlp.experts.88.down_proj", "model.layers.57.mlp.experts.89.down_proj", "model.layers.57.mlp.experts.90.down_proj", "model.layers.57.mlp.experts.91.down_proj", "model.layers.57.mlp.experts.92.down_proj", "model.layers.57.mlp.experts.93.down_proj", "model.layers.57.mlp.experts.94.down_proj", "model.layers.57.mlp.experts.95.down_proj", "model.layers.57.mlp.experts.96.down_proj", "model.layers.57.mlp.experts.97.down_proj", "model.layers.57.mlp.experts.98.down_proj", "model.layers.57.mlp.experts.99.down_proj", "model.layers.57.mlp.experts.100.down_proj", "model.layers.57.mlp.experts.101.down_proj", "model.layers.57.mlp.experts.102.down_proj", "model.layers.57.mlp.experts.103.down_proj", "model.layers.57.mlp.experts.104.down_proj", "model.layers.57.mlp.experts.105.down_proj", "model.layers.57.mlp.experts.106.down_proj", "model.layers.57.mlp.experts.107.down_proj", "model.layers.57.mlp.experts.108.down_proj", "model.layers.57.mlp.experts.109.down_proj", "model.layers.57.mlp.experts.110.down_proj", "model.layers.57.mlp.experts.111.down_proj", "model.layers.57.mlp.experts.112.down_proj", "model.layers.57.mlp.experts.113.down_proj", "model.layers.57.mlp.experts.114.down_proj", "model.layers.57.mlp.experts.115.down_proj", "model.layers.57.mlp.experts.116.down_proj", "model.layers.57.mlp.experts.117.down_proj", "model.layers.57.mlp.experts.118.down_proj", "model.layers.57.mlp.experts.119.down_proj", "model.layers.57.mlp.experts.120.down_proj", "model.layers.57.mlp.experts.121.down_proj", "model.layers.57.mlp.experts.122.down_proj", "model.layers.57.mlp.experts.123.down_proj", "model.layers.57.mlp.experts.124.down_proj", "model.layers.57.mlp.experts.125.down_proj", "model.layers.57.mlp.experts.126.down_proj", "model.layers.57.mlp.experts.127.down_proj", "model.layers.57.mlp.experts.128.down_proj", "model.layers.57.mlp.experts.129.down_proj", "model.layers.57.mlp.experts.130.down_proj", "model.layers.57.mlp.experts.131.down_proj", "model.layers.57.mlp.experts.132.down_proj", "model.layers.57.mlp.experts.133.down_proj", "model.layers.57.mlp.experts.134.down_proj", "model.layers.57.mlp.experts.135.down_proj", "model.layers.57.mlp.experts.136.down_proj", "model.layers.57.mlp.experts.137.down_proj", "model.layers.57.mlp.experts.138.down_proj", "model.layers.57.mlp.experts.139.down_proj", "model.layers.57.mlp.experts.140.down_proj", "model.layers.57.mlp.experts.141.down_proj", "model.layers.57.mlp.experts.142.down_proj", "model.layers.57.mlp.experts.143.down_proj", "model.layers.57.mlp.experts.144.down_proj", "model.layers.57.mlp.experts.145.down_proj", "model.layers.57.mlp.experts.146.down_proj", "model.layers.57.mlp.experts.147.down_proj", "model.layers.57.mlp.experts.148.down_proj", "model.layers.57.mlp.experts.149.down_proj", "model.layers.57.mlp.experts.150.down_proj", "model.layers.57.mlp.experts.151.down_proj", "model.layers.57.mlp.experts.152.down_proj", "model.layers.57.mlp.experts.153.down_proj", "model.layers.57.mlp.experts.154.down_proj", "model.layers.57.mlp.experts.155.down_proj", "model.layers.57.mlp.experts.156.down_proj", "model.layers.57.mlp.experts.157.down_proj", "model.layers.57.mlp.experts.158.down_proj", "model.layers.57.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.2455188445746205e-05, "dbits": 1258291200 }, { "dkld": -2.472677733749047e-05, "dbits": 2516582400 } ] }, { "idx": 345, "layers": [ "model.layers.58.self_attn.q_proj" ], "candidates": [ { "dkld": 1.9354745745658875e-05, "dbits": 62914560 }, { "dkld": -7.470394484697385e-06, "dbits": 125829120 } ] }, { "idx": 346, "layers": [ "model.layers.58.self_attn.k_proj", "model.layers.58.self_attn.v_proj" ], "candidates": [ { "dkld": 3.495579585434394e-06, "dbits": 10485760 }, { "dkld": -1.3352045789359612e-05, "dbits": 20971520 } ] }, { "idx": 347, "layers": [ "model.layers.58.self_attn.o_proj" ], "candidates": [ { "dkld": -1.281597651541129e-05, "dbits": 62914560 }, { "dkld": -1.1577550321816357e-05, "dbits": 125829120 } ] }, { "idx": 348, "layers": [ "model.layers.58.mlp.shared_experts.gate_proj", "model.layers.58.mlp.shared_experts.up_proj", "model.layers.58.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 5.300231277942727e-05, "dbits": 23592960 }, { "dkld": 4.304291214794059e-05, "dbits": 47185920 } ] }, { "idx": 349, "layers": [ "model.layers.58.mlp.experts.0.gate_proj", "model.layers.58.mlp.experts.1.gate_proj", "model.layers.58.mlp.experts.2.gate_proj", "model.layers.58.mlp.experts.3.gate_proj", "model.layers.58.mlp.experts.4.gate_proj", "model.layers.58.mlp.experts.5.gate_proj", "model.layers.58.mlp.experts.6.gate_proj", "model.layers.58.mlp.experts.7.gate_proj", "model.layers.58.mlp.experts.8.gate_proj", "model.layers.58.mlp.experts.9.gate_proj", "model.layers.58.mlp.experts.10.gate_proj", "model.layers.58.mlp.experts.11.gate_proj", "model.layers.58.mlp.experts.12.gate_proj", "model.layers.58.mlp.experts.13.gate_proj", "model.layers.58.mlp.experts.14.gate_proj", "model.layers.58.mlp.experts.15.gate_proj", "model.layers.58.mlp.experts.16.gate_proj", "model.layers.58.mlp.experts.17.gate_proj", "model.layers.58.mlp.experts.18.gate_proj", "model.layers.58.mlp.experts.19.gate_proj", "model.layers.58.mlp.experts.20.gate_proj", "model.layers.58.mlp.experts.21.gate_proj", "model.layers.58.mlp.experts.22.gate_proj", "model.layers.58.mlp.experts.23.gate_proj", "model.layers.58.mlp.experts.24.gate_proj", "model.layers.58.mlp.experts.25.gate_proj", "model.layers.58.mlp.experts.26.gate_proj", "model.layers.58.mlp.experts.27.gate_proj", "model.layers.58.mlp.experts.28.gate_proj", "model.layers.58.mlp.experts.29.gate_proj", "model.layers.58.mlp.experts.30.gate_proj", "model.layers.58.mlp.experts.31.gate_proj", "model.layers.58.mlp.experts.32.gate_proj", "model.layers.58.mlp.experts.33.gate_proj", "model.layers.58.mlp.experts.34.gate_proj", "model.layers.58.mlp.experts.35.gate_proj", "model.layers.58.mlp.experts.36.gate_proj", "model.layers.58.mlp.experts.37.gate_proj", "model.layers.58.mlp.experts.38.gate_proj", "model.layers.58.mlp.experts.39.gate_proj", "model.layers.58.mlp.experts.40.gate_proj", "model.layers.58.mlp.experts.41.gate_proj", "model.layers.58.mlp.experts.42.gate_proj", "model.layers.58.mlp.experts.43.gate_proj", "model.layers.58.mlp.experts.44.gate_proj", "model.layers.58.mlp.experts.45.gate_proj", "model.layers.58.mlp.experts.46.gate_proj", "model.layers.58.mlp.experts.47.gate_proj", "model.layers.58.mlp.experts.48.gate_proj", "model.layers.58.mlp.experts.49.gate_proj", "model.layers.58.mlp.experts.50.gate_proj", "model.layers.58.mlp.experts.51.gate_proj", "model.layers.58.mlp.experts.52.gate_proj", "model.layers.58.mlp.experts.53.gate_proj", "model.layers.58.mlp.experts.54.gate_proj", "model.layers.58.mlp.experts.55.gate_proj", "model.layers.58.mlp.experts.56.gate_proj", "model.layers.58.mlp.experts.57.gate_proj", "model.layers.58.mlp.experts.58.gate_proj", "model.layers.58.mlp.experts.59.gate_proj", "model.layers.58.mlp.experts.60.gate_proj", "model.layers.58.mlp.experts.61.gate_proj", "model.layers.58.mlp.experts.62.gate_proj", "model.layers.58.mlp.experts.63.gate_proj", "model.layers.58.mlp.experts.64.gate_proj", "model.layers.58.mlp.experts.65.gate_proj", "model.layers.58.mlp.experts.66.gate_proj", "model.layers.58.mlp.experts.67.gate_proj", "model.layers.58.mlp.experts.68.gate_proj", "model.layers.58.mlp.experts.69.gate_proj", "model.layers.58.mlp.experts.70.gate_proj", "model.layers.58.mlp.experts.71.gate_proj", "model.layers.58.mlp.experts.72.gate_proj", "model.layers.58.mlp.experts.73.gate_proj", "model.layers.58.mlp.experts.74.gate_proj", "model.layers.58.mlp.experts.75.gate_proj", "model.layers.58.mlp.experts.76.gate_proj", "model.layers.58.mlp.experts.77.gate_proj", "model.layers.58.mlp.experts.78.gate_proj", "model.layers.58.mlp.experts.79.gate_proj", "model.layers.58.mlp.experts.80.gate_proj", "model.layers.58.mlp.experts.81.gate_proj", "model.layers.58.mlp.experts.82.gate_proj", "model.layers.58.mlp.experts.83.gate_proj", "model.layers.58.mlp.experts.84.gate_proj", "model.layers.58.mlp.experts.85.gate_proj", "model.layers.58.mlp.experts.86.gate_proj", "model.layers.58.mlp.experts.87.gate_proj", "model.layers.58.mlp.experts.88.gate_proj", "model.layers.58.mlp.experts.89.gate_proj", "model.layers.58.mlp.experts.90.gate_proj", "model.layers.58.mlp.experts.91.gate_proj", "model.layers.58.mlp.experts.92.gate_proj", "model.layers.58.mlp.experts.93.gate_proj", "model.layers.58.mlp.experts.94.gate_proj", "model.layers.58.mlp.experts.95.gate_proj", "model.layers.58.mlp.experts.96.gate_proj", "model.layers.58.mlp.experts.97.gate_proj", "model.layers.58.mlp.experts.98.gate_proj", "model.layers.58.mlp.experts.99.gate_proj", "model.layers.58.mlp.experts.100.gate_proj", "model.layers.58.mlp.experts.101.gate_proj", "model.layers.58.mlp.experts.102.gate_proj", "model.layers.58.mlp.experts.103.gate_proj", "model.layers.58.mlp.experts.104.gate_proj", "model.layers.58.mlp.experts.105.gate_proj", "model.layers.58.mlp.experts.106.gate_proj", "model.layers.58.mlp.experts.107.gate_proj", "model.layers.58.mlp.experts.108.gate_proj", "model.layers.58.mlp.experts.109.gate_proj", "model.layers.58.mlp.experts.110.gate_proj", "model.layers.58.mlp.experts.111.gate_proj", "model.layers.58.mlp.experts.112.gate_proj", "model.layers.58.mlp.experts.113.gate_proj", "model.layers.58.mlp.experts.114.gate_proj", "model.layers.58.mlp.experts.115.gate_proj", "model.layers.58.mlp.experts.116.gate_proj", "model.layers.58.mlp.experts.117.gate_proj", "model.layers.58.mlp.experts.118.gate_proj", "model.layers.58.mlp.experts.119.gate_proj", "model.layers.58.mlp.experts.120.gate_proj", "model.layers.58.mlp.experts.121.gate_proj", "model.layers.58.mlp.experts.122.gate_proj", "model.layers.58.mlp.experts.123.gate_proj", "model.layers.58.mlp.experts.124.gate_proj", "model.layers.58.mlp.experts.125.gate_proj", "model.layers.58.mlp.experts.126.gate_proj", "model.layers.58.mlp.experts.127.gate_proj", "model.layers.58.mlp.experts.128.gate_proj", "model.layers.58.mlp.experts.129.gate_proj", "model.layers.58.mlp.experts.130.gate_proj", "model.layers.58.mlp.experts.131.gate_proj", "model.layers.58.mlp.experts.132.gate_proj", "model.layers.58.mlp.experts.133.gate_proj", "model.layers.58.mlp.experts.134.gate_proj", "model.layers.58.mlp.experts.135.gate_proj", "model.layers.58.mlp.experts.136.gate_proj", "model.layers.58.mlp.experts.137.gate_proj", "model.layers.58.mlp.experts.138.gate_proj", "model.layers.58.mlp.experts.139.gate_proj", "model.layers.58.mlp.experts.140.gate_proj", "model.layers.58.mlp.experts.141.gate_proj", "model.layers.58.mlp.experts.142.gate_proj", "model.layers.58.mlp.experts.143.gate_proj", "model.layers.58.mlp.experts.144.gate_proj", "model.layers.58.mlp.experts.145.gate_proj", "model.layers.58.mlp.experts.146.gate_proj", "model.layers.58.mlp.experts.147.gate_proj", "model.layers.58.mlp.experts.148.gate_proj", "model.layers.58.mlp.experts.149.gate_proj", "model.layers.58.mlp.experts.150.gate_proj", "model.layers.58.mlp.experts.151.gate_proj", "model.layers.58.mlp.experts.152.gate_proj", "model.layers.58.mlp.experts.153.gate_proj", "model.layers.58.mlp.experts.154.gate_proj", "model.layers.58.mlp.experts.155.gate_proj", "model.layers.58.mlp.experts.156.gate_proj", "model.layers.58.mlp.experts.157.gate_proj", "model.layers.58.mlp.experts.158.gate_proj", "model.layers.58.mlp.experts.159.gate_proj", "model.layers.58.mlp.experts.0.up_proj", "model.layers.58.mlp.experts.1.up_proj", "model.layers.58.mlp.experts.2.up_proj", "model.layers.58.mlp.experts.3.up_proj", "model.layers.58.mlp.experts.4.up_proj", "model.layers.58.mlp.experts.5.up_proj", "model.layers.58.mlp.experts.6.up_proj", "model.layers.58.mlp.experts.7.up_proj", "model.layers.58.mlp.experts.8.up_proj", "model.layers.58.mlp.experts.9.up_proj", "model.layers.58.mlp.experts.10.up_proj", "model.layers.58.mlp.experts.11.up_proj", "model.layers.58.mlp.experts.12.up_proj", "model.layers.58.mlp.experts.13.up_proj", "model.layers.58.mlp.experts.14.up_proj", "model.layers.58.mlp.experts.15.up_proj", "model.layers.58.mlp.experts.16.up_proj", "model.layers.58.mlp.experts.17.up_proj", "model.layers.58.mlp.experts.18.up_proj", "model.layers.58.mlp.experts.19.up_proj", "model.layers.58.mlp.experts.20.up_proj", "model.layers.58.mlp.experts.21.up_proj", "model.layers.58.mlp.experts.22.up_proj", "model.layers.58.mlp.experts.23.up_proj", "model.layers.58.mlp.experts.24.up_proj", "model.layers.58.mlp.experts.25.up_proj", "model.layers.58.mlp.experts.26.up_proj", "model.layers.58.mlp.experts.27.up_proj", "model.layers.58.mlp.experts.28.up_proj", "model.layers.58.mlp.experts.29.up_proj", "model.layers.58.mlp.experts.30.up_proj", "model.layers.58.mlp.experts.31.up_proj", "model.layers.58.mlp.experts.32.up_proj", "model.layers.58.mlp.experts.33.up_proj", "model.layers.58.mlp.experts.34.up_proj", "model.layers.58.mlp.experts.35.up_proj", "model.layers.58.mlp.experts.36.up_proj", "model.layers.58.mlp.experts.37.up_proj", "model.layers.58.mlp.experts.38.up_proj", "model.layers.58.mlp.experts.39.up_proj", "model.layers.58.mlp.experts.40.up_proj", "model.layers.58.mlp.experts.41.up_proj", "model.layers.58.mlp.experts.42.up_proj", "model.layers.58.mlp.experts.43.up_proj", "model.layers.58.mlp.experts.44.up_proj", "model.layers.58.mlp.experts.45.up_proj", "model.layers.58.mlp.experts.46.up_proj", "model.layers.58.mlp.experts.47.up_proj", "model.layers.58.mlp.experts.48.up_proj", "model.layers.58.mlp.experts.49.up_proj", "model.layers.58.mlp.experts.50.up_proj", "model.layers.58.mlp.experts.51.up_proj", "model.layers.58.mlp.experts.52.up_proj", "model.layers.58.mlp.experts.53.up_proj", "model.layers.58.mlp.experts.54.up_proj", "model.layers.58.mlp.experts.55.up_proj", "model.layers.58.mlp.experts.56.up_proj", "model.layers.58.mlp.experts.57.up_proj", "model.layers.58.mlp.experts.58.up_proj", "model.layers.58.mlp.experts.59.up_proj", "model.layers.58.mlp.experts.60.up_proj", "model.layers.58.mlp.experts.61.up_proj", "model.layers.58.mlp.experts.62.up_proj", "model.layers.58.mlp.experts.63.up_proj", "model.layers.58.mlp.experts.64.up_proj", "model.layers.58.mlp.experts.65.up_proj", "model.layers.58.mlp.experts.66.up_proj", "model.layers.58.mlp.experts.67.up_proj", "model.layers.58.mlp.experts.68.up_proj", "model.layers.58.mlp.experts.69.up_proj", "model.layers.58.mlp.experts.70.up_proj", "model.layers.58.mlp.experts.71.up_proj", "model.layers.58.mlp.experts.72.up_proj", "model.layers.58.mlp.experts.73.up_proj", "model.layers.58.mlp.experts.74.up_proj", "model.layers.58.mlp.experts.75.up_proj", "model.layers.58.mlp.experts.76.up_proj", "model.layers.58.mlp.experts.77.up_proj", "model.layers.58.mlp.experts.78.up_proj", "model.layers.58.mlp.experts.79.up_proj", "model.layers.58.mlp.experts.80.up_proj", "model.layers.58.mlp.experts.81.up_proj", "model.layers.58.mlp.experts.82.up_proj", "model.layers.58.mlp.experts.83.up_proj", "model.layers.58.mlp.experts.84.up_proj", "model.layers.58.mlp.experts.85.up_proj", "model.layers.58.mlp.experts.86.up_proj", "model.layers.58.mlp.experts.87.up_proj", "model.layers.58.mlp.experts.88.up_proj", "model.layers.58.mlp.experts.89.up_proj", "model.layers.58.mlp.experts.90.up_proj", "model.layers.58.mlp.experts.91.up_proj", "model.layers.58.mlp.experts.92.up_proj", "model.layers.58.mlp.experts.93.up_proj", "model.layers.58.mlp.experts.94.up_proj", "model.layers.58.mlp.experts.95.up_proj", "model.layers.58.mlp.experts.96.up_proj", "model.layers.58.mlp.experts.97.up_proj", "model.layers.58.mlp.experts.98.up_proj", "model.layers.58.mlp.experts.99.up_proj", "model.layers.58.mlp.experts.100.up_proj", "model.layers.58.mlp.experts.101.up_proj", "model.layers.58.mlp.experts.102.up_proj", "model.layers.58.mlp.experts.103.up_proj", "model.layers.58.mlp.experts.104.up_proj", "model.layers.58.mlp.experts.105.up_proj", "model.layers.58.mlp.experts.106.up_proj", "model.layers.58.mlp.experts.107.up_proj", "model.layers.58.mlp.experts.108.up_proj", "model.layers.58.mlp.experts.109.up_proj", "model.layers.58.mlp.experts.110.up_proj", "model.layers.58.mlp.experts.111.up_proj", "model.layers.58.mlp.experts.112.up_proj", "model.layers.58.mlp.experts.113.up_proj", "model.layers.58.mlp.experts.114.up_proj", "model.layers.58.mlp.experts.115.up_proj", "model.layers.58.mlp.experts.116.up_proj", "model.layers.58.mlp.experts.117.up_proj", "model.layers.58.mlp.experts.118.up_proj", "model.layers.58.mlp.experts.119.up_proj", "model.layers.58.mlp.experts.120.up_proj", "model.layers.58.mlp.experts.121.up_proj", "model.layers.58.mlp.experts.122.up_proj", "model.layers.58.mlp.experts.123.up_proj", "model.layers.58.mlp.experts.124.up_proj", "model.layers.58.mlp.experts.125.up_proj", "model.layers.58.mlp.experts.126.up_proj", "model.layers.58.mlp.experts.127.up_proj", "model.layers.58.mlp.experts.128.up_proj", "model.layers.58.mlp.experts.129.up_proj", "model.layers.58.mlp.experts.130.up_proj", "model.layers.58.mlp.experts.131.up_proj", "model.layers.58.mlp.experts.132.up_proj", "model.layers.58.mlp.experts.133.up_proj", "model.layers.58.mlp.experts.134.up_proj", "model.layers.58.mlp.experts.135.up_proj", "model.layers.58.mlp.experts.136.up_proj", "model.layers.58.mlp.experts.137.up_proj", "model.layers.58.mlp.experts.138.up_proj", "model.layers.58.mlp.experts.139.up_proj", "model.layers.58.mlp.experts.140.up_proj", "model.layers.58.mlp.experts.141.up_proj", "model.layers.58.mlp.experts.142.up_proj", "model.layers.58.mlp.experts.143.up_proj", "model.layers.58.mlp.experts.144.up_proj", "model.layers.58.mlp.experts.145.up_proj", "model.layers.58.mlp.experts.146.up_proj", "model.layers.58.mlp.experts.147.up_proj", "model.layers.58.mlp.experts.148.up_proj", "model.layers.58.mlp.experts.149.up_proj", "model.layers.58.mlp.experts.150.up_proj", "model.layers.58.mlp.experts.151.up_proj", "model.layers.58.mlp.experts.152.up_proj", "model.layers.58.mlp.experts.153.up_proj", "model.layers.58.mlp.experts.154.up_proj", "model.layers.58.mlp.experts.155.up_proj", "model.layers.58.mlp.experts.156.up_proj", "model.layers.58.mlp.experts.157.up_proj", "model.layers.58.mlp.experts.158.up_proj", "model.layers.58.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.1325860396028259e-05, "dbits": 2516582400 }, { "dkld": 1.7218058928847313e-05, "dbits": 5033164800 } ] }, { "idx": 350, "layers": [ "model.layers.58.mlp.experts.0.down_proj", "model.layers.58.mlp.experts.1.down_proj", "model.layers.58.mlp.experts.2.down_proj", "model.layers.58.mlp.experts.3.down_proj", "model.layers.58.mlp.experts.4.down_proj", "model.layers.58.mlp.experts.5.down_proj", "model.layers.58.mlp.experts.6.down_proj", "model.layers.58.mlp.experts.7.down_proj", "model.layers.58.mlp.experts.8.down_proj", "model.layers.58.mlp.experts.9.down_proj", "model.layers.58.mlp.experts.10.down_proj", "model.layers.58.mlp.experts.11.down_proj", "model.layers.58.mlp.experts.12.down_proj", "model.layers.58.mlp.experts.13.down_proj", "model.layers.58.mlp.experts.14.down_proj", "model.layers.58.mlp.experts.15.down_proj", "model.layers.58.mlp.experts.16.down_proj", "model.layers.58.mlp.experts.17.down_proj", "model.layers.58.mlp.experts.18.down_proj", "model.layers.58.mlp.experts.19.down_proj", "model.layers.58.mlp.experts.20.down_proj", "model.layers.58.mlp.experts.21.down_proj", "model.layers.58.mlp.experts.22.down_proj", "model.layers.58.mlp.experts.23.down_proj", "model.layers.58.mlp.experts.24.down_proj", "model.layers.58.mlp.experts.25.down_proj", "model.layers.58.mlp.experts.26.down_proj", "model.layers.58.mlp.experts.27.down_proj", "model.layers.58.mlp.experts.28.down_proj", "model.layers.58.mlp.experts.29.down_proj", "model.layers.58.mlp.experts.30.down_proj", "model.layers.58.mlp.experts.31.down_proj", "model.layers.58.mlp.experts.32.down_proj", "model.layers.58.mlp.experts.33.down_proj", "model.layers.58.mlp.experts.34.down_proj", "model.layers.58.mlp.experts.35.down_proj", "model.layers.58.mlp.experts.36.down_proj", "model.layers.58.mlp.experts.37.down_proj", "model.layers.58.mlp.experts.38.down_proj", "model.layers.58.mlp.experts.39.down_proj", "model.layers.58.mlp.experts.40.down_proj", "model.layers.58.mlp.experts.41.down_proj", "model.layers.58.mlp.experts.42.down_proj", "model.layers.58.mlp.experts.43.down_proj", "model.layers.58.mlp.experts.44.down_proj", "model.layers.58.mlp.experts.45.down_proj", "model.layers.58.mlp.experts.46.down_proj", "model.layers.58.mlp.experts.47.down_proj", "model.layers.58.mlp.experts.48.down_proj", "model.layers.58.mlp.experts.49.down_proj", "model.layers.58.mlp.experts.50.down_proj", "model.layers.58.mlp.experts.51.down_proj", "model.layers.58.mlp.experts.52.down_proj", "model.layers.58.mlp.experts.53.down_proj", "model.layers.58.mlp.experts.54.down_proj", "model.layers.58.mlp.experts.55.down_proj", "model.layers.58.mlp.experts.56.down_proj", "model.layers.58.mlp.experts.57.down_proj", "model.layers.58.mlp.experts.58.down_proj", "model.layers.58.mlp.experts.59.down_proj", "model.layers.58.mlp.experts.60.down_proj", "model.layers.58.mlp.experts.61.down_proj", "model.layers.58.mlp.experts.62.down_proj", "model.layers.58.mlp.experts.63.down_proj", "model.layers.58.mlp.experts.64.down_proj", "model.layers.58.mlp.experts.65.down_proj", "model.layers.58.mlp.experts.66.down_proj", "model.layers.58.mlp.experts.67.down_proj", "model.layers.58.mlp.experts.68.down_proj", "model.layers.58.mlp.experts.69.down_proj", "model.layers.58.mlp.experts.70.down_proj", "model.layers.58.mlp.experts.71.down_proj", "model.layers.58.mlp.experts.72.down_proj", "model.layers.58.mlp.experts.73.down_proj", "model.layers.58.mlp.experts.74.down_proj", "model.layers.58.mlp.experts.75.down_proj", "model.layers.58.mlp.experts.76.down_proj", "model.layers.58.mlp.experts.77.down_proj", "model.layers.58.mlp.experts.78.down_proj", "model.layers.58.mlp.experts.79.down_proj", "model.layers.58.mlp.experts.80.down_proj", "model.layers.58.mlp.experts.81.down_proj", "model.layers.58.mlp.experts.82.down_proj", "model.layers.58.mlp.experts.83.down_proj", "model.layers.58.mlp.experts.84.down_proj", "model.layers.58.mlp.experts.85.down_proj", "model.layers.58.mlp.experts.86.down_proj", "model.layers.58.mlp.experts.87.down_proj", "model.layers.58.mlp.experts.88.down_proj", "model.layers.58.mlp.experts.89.down_proj", "model.layers.58.mlp.experts.90.down_proj", "model.layers.58.mlp.experts.91.down_proj", "model.layers.58.mlp.experts.92.down_proj", "model.layers.58.mlp.experts.93.down_proj", "model.layers.58.mlp.experts.94.down_proj", "model.layers.58.mlp.experts.95.down_proj", "model.layers.58.mlp.experts.96.down_proj", "model.layers.58.mlp.experts.97.down_proj", "model.layers.58.mlp.experts.98.down_proj", "model.layers.58.mlp.experts.99.down_proj", "model.layers.58.mlp.experts.100.down_proj", "model.layers.58.mlp.experts.101.down_proj", "model.layers.58.mlp.experts.102.down_proj", "model.layers.58.mlp.experts.103.down_proj", "model.layers.58.mlp.experts.104.down_proj", "model.layers.58.mlp.experts.105.down_proj", "model.layers.58.mlp.experts.106.down_proj", "model.layers.58.mlp.experts.107.down_proj", "model.layers.58.mlp.experts.108.down_proj", "model.layers.58.mlp.experts.109.down_proj", "model.layers.58.mlp.experts.110.down_proj", "model.layers.58.mlp.experts.111.down_proj", "model.layers.58.mlp.experts.112.down_proj", "model.layers.58.mlp.experts.113.down_proj", "model.layers.58.mlp.experts.114.down_proj", "model.layers.58.mlp.experts.115.down_proj", "model.layers.58.mlp.experts.116.down_proj", "model.layers.58.mlp.experts.117.down_proj", "model.layers.58.mlp.experts.118.down_proj", "model.layers.58.mlp.experts.119.down_proj", "model.layers.58.mlp.experts.120.down_proj", "model.layers.58.mlp.experts.121.down_proj", "model.layers.58.mlp.experts.122.down_proj", "model.layers.58.mlp.experts.123.down_proj", "model.layers.58.mlp.experts.124.down_proj", "model.layers.58.mlp.experts.125.down_proj", "model.layers.58.mlp.experts.126.down_proj", "model.layers.58.mlp.experts.127.down_proj", "model.layers.58.mlp.experts.128.down_proj", "model.layers.58.mlp.experts.129.down_proj", "model.layers.58.mlp.experts.130.down_proj", "model.layers.58.mlp.experts.131.down_proj", "model.layers.58.mlp.experts.132.down_proj", "model.layers.58.mlp.experts.133.down_proj", "model.layers.58.mlp.experts.134.down_proj", "model.layers.58.mlp.experts.135.down_proj", "model.layers.58.mlp.experts.136.down_proj", "model.layers.58.mlp.experts.137.down_proj", "model.layers.58.mlp.experts.138.down_proj", "model.layers.58.mlp.experts.139.down_proj", "model.layers.58.mlp.experts.140.down_proj", "model.layers.58.mlp.experts.141.down_proj", "model.layers.58.mlp.experts.142.down_proj", "model.layers.58.mlp.experts.143.down_proj", "model.layers.58.mlp.experts.144.down_proj", "model.layers.58.mlp.experts.145.down_proj", "model.layers.58.mlp.experts.146.down_proj", "model.layers.58.mlp.experts.147.down_proj", "model.layers.58.mlp.experts.148.down_proj", "model.layers.58.mlp.experts.149.down_proj", "model.layers.58.mlp.experts.150.down_proj", "model.layers.58.mlp.experts.151.down_proj", "model.layers.58.mlp.experts.152.down_proj", "model.layers.58.mlp.experts.153.down_proj", "model.layers.58.mlp.experts.154.down_proj", "model.layers.58.mlp.experts.155.down_proj", "model.layers.58.mlp.experts.156.down_proj", "model.layers.58.mlp.experts.157.down_proj", "model.layers.58.mlp.experts.158.down_proj", "model.layers.58.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 1.0087154805660248e-05, "dbits": 1258291200 }, { "dkld": -9.38803423196008e-06, "dbits": 2516582400 } ] }, { "idx": 351, "layers": [ "model.layers.59.self_attn.q_proj" ], "candidates": [ { "dkld": 1.158006489277233e-06, "dbits": 62914560 }, { "dkld": 2.671864349395106e-05, "dbits": 125829120 } ] }, { "idx": 352, "layers": [ "model.layers.59.self_attn.k_proj", "model.layers.59.self_attn.v_proj" ], "candidates": [ { "dkld": -3.7124915979801915e-05, "dbits": 10485760 }, { "dkld": -3.225051332265104e-05, "dbits": 20971520 } ] }, { "idx": 353, "layers": [ "model.layers.59.self_attn.o_proj" ], "candidates": [ { "dkld": -2.164954785257439e-05, "dbits": 62914560 }, { "dkld": -1.5960447490213914e-05, "dbits": 125829120 } ] }, { "idx": 354, "layers": [ "model.layers.59.mlp.shared_experts.gate_proj", "model.layers.59.mlp.shared_experts.up_proj", "model.layers.59.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.581643734127144e-05, "dbits": 23592960 }, { "dkld": -4.377989098429576e-05, "dbits": 47185920 } ] }, { "idx": 355, "layers": [ "model.layers.59.mlp.experts.0.gate_proj", "model.layers.59.mlp.experts.1.gate_proj", "model.layers.59.mlp.experts.2.gate_proj", "model.layers.59.mlp.experts.3.gate_proj", "model.layers.59.mlp.experts.4.gate_proj", "model.layers.59.mlp.experts.5.gate_proj", "model.layers.59.mlp.experts.6.gate_proj", "model.layers.59.mlp.experts.7.gate_proj", "model.layers.59.mlp.experts.8.gate_proj", "model.layers.59.mlp.experts.9.gate_proj", "model.layers.59.mlp.experts.10.gate_proj", "model.layers.59.mlp.experts.11.gate_proj", "model.layers.59.mlp.experts.12.gate_proj", "model.layers.59.mlp.experts.13.gate_proj", "model.layers.59.mlp.experts.14.gate_proj", "model.layers.59.mlp.experts.15.gate_proj", "model.layers.59.mlp.experts.16.gate_proj", "model.layers.59.mlp.experts.17.gate_proj", "model.layers.59.mlp.experts.18.gate_proj", "model.layers.59.mlp.experts.19.gate_proj", "model.layers.59.mlp.experts.20.gate_proj", "model.layers.59.mlp.experts.21.gate_proj", "model.layers.59.mlp.experts.22.gate_proj", "model.layers.59.mlp.experts.23.gate_proj", "model.layers.59.mlp.experts.24.gate_proj", "model.layers.59.mlp.experts.25.gate_proj", "model.layers.59.mlp.experts.26.gate_proj", "model.layers.59.mlp.experts.27.gate_proj", "model.layers.59.mlp.experts.28.gate_proj", "model.layers.59.mlp.experts.29.gate_proj", "model.layers.59.mlp.experts.30.gate_proj", "model.layers.59.mlp.experts.31.gate_proj", "model.layers.59.mlp.experts.32.gate_proj", "model.layers.59.mlp.experts.33.gate_proj", "model.layers.59.mlp.experts.34.gate_proj", "model.layers.59.mlp.experts.35.gate_proj", "model.layers.59.mlp.experts.36.gate_proj", "model.layers.59.mlp.experts.37.gate_proj", "model.layers.59.mlp.experts.38.gate_proj", "model.layers.59.mlp.experts.39.gate_proj", "model.layers.59.mlp.experts.40.gate_proj", "model.layers.59.mlp.experts.41.gate_proj", "model.layers.59.mlp.experts.42.gate_proj", "model.layers.59.mlp.experts.43.gate_proj", "model.layers.59.mlp.experts.44.gate_proj", "model.layers.59.mlp.experts.45.gate_proj", "model.layers.59.mlp.experts.46.gate_proj", "model.layers.59.mlp.experts.47.gate_proj", "model.layers.59.mlp.experts.48.gate_proj", "model.layers.59.mlp.experts.49.gate_proj", "model.layers.59.mlp.experts.50.gate_proj", "model.layers.59.mlp.experts.51.gate_proj", "model.layers.59.mlp.experts.52.gate_proj", "model.layers.59.mlp.experts.53.gate_proj", "model.layers.59.mlp.experts.54.gate_proj", "model.layers.59.mlp.experts.55.gate_proj", "model.layers.59.mlp.experts.56.gate_proj", "model.layers.59.mlp.experts.57.gate_proj", "model.layers.59.mlp.experts.58.gate_proj", "model.layers.59.mlp.experts.59.gate_proj", "model.layers.59.mlp.experts.60.gate_proj", "model.layers.59.mlp.experts.61.gate_proj", "model.layers.59.mlp.experts.62.gate_proj", "model.layers.59.mlp.experts.63.gate_proj", "model.layers.59.mlp.experts.64.gate_proj", "model.layers.59.mlp.experts.65.gate_proj", "model.layers.59.mlp.experts.66.gate_proj", "model.layers.59.mlp.experts.67.gate_proj", "model.layers.59.mlp.experts.68.gate_proj", "model.layers.59.mlp.experts.69.gate_proj", "model.layers.59.mlp.experts.70.gate_proj", "model.layers.59.mlp.experts.71.gate_proj", "model.layers.59.mlp.experts.72.gate_proj", "model.layers.59.mlp.experts.73.gate_proj", "model.layers.59.mlp.experts.74.gate_proj", "model.layers.59.mlp.experts.75.gate_proj", "model.layers.59.mlp.experts.76.gate_proj", "model.layers.59.mlp.experts.77.gate_proj", "model.layers.59.mlp.experts.78.gate_proj", "model.layers.59.mlp.experts.79.gate_proj", "model.layers.59.mlp.experts.80.gate_proj", "model.layers.59.mlp.experts.81.gate_proj", "model.layers.59.mlp.experts.82.gate_proj", "model.layers.59.mlp.experts.83.gate_proj", "model.layers.59.mlp.experts.84.gate_proj", "model.layers.59.mlp.experts.85.gate_proj", "model.layers.59.mlp.experts.86.gate_proj", "model.layers.59.mlp.experts.87.gate_proj", "model.layers.59.mlp.experts.88.gate_proj", "model.layers.59.mlp.experts.89.gate_proj", "model.layers.59.mlp.experts.90.gate_proj", "model.layers.59.mlp.experts.91.gate_proj", "model.layers.59.mlp.experts.92.gate_proj", "model.layers.59.mlp.experts.93.gate_proj", "model.layers.59.mlp.experts.94.gate_proj", "model.layers.59.mlp.experts.95.gate_proj", "model.layers.59.mlp.experts.96.gate_proj", "model.layers.59.mlp.experts.97.gate_proj", "model.layers.59.mlp.experts.98.gate_proj", "model.layers.59.mlp.experts.99.gate_proj", "model.layers.59.mlp.experts.100.gate_proj", "model.layers.59.mlp.experts.101.gate_proj", "model.layers.59.mlp.experts.102.gate_proj", "model.layers.59.mlp.experts.103.gate_proj", "model.layers.59.mlp.experts.104.gate_proj", "model.layers.59.mlp.experts.105.gate_proj", "model.layers.59.mlp.experts.106.gate_proj", "model.layers.59.mlp.experts.107.gate_proj", "model.layers.59.mlp.experts.108.gate_proj", "model.layers.59.mlp.experts.109.gate_proj", "model.layers.59.mlp.experts.110.gate_proj", "model.layers.59.mlp.experts.111.gate_proj", "model.layers.59.mlp.experts.112.gate_proj", "model.layers.59.mlp.experts.113.gate_proj", "model.layers.59.mlp.experts.114.gate_proj", "model.layers.59.mlp.experts.115.gate_proj", "model.layers.59.mlp.experts.116.gate_proj", "model.layers.59.mlp.experts.117.gate_proj", "model.layers.59.mlp.experts.118.gate_proj", "model.layers.59.mlp.experts.119.gate_proj", "model.layers.59.mlp.experts.120.gate_proj", "model.layers.59.mlp.experts.121.gate_proj", "model.layers.59.mlp.experts.122.gate_proj", "model.layers.59.mlp.experts.123.gate_proj", "model.layers.59.mlp.experts.124.gate_proj", "model.layers.59.mlp.experts.125.gate_proj", "model.layers.59.mlp.experts.126.gate_proj", "model.layers.59.mlp.experts.127.gate_proj", "model.layers.59.mlp.experts.128.gate_proj", "model.layers.59.mlp.experts.129.gate_proj", "model.layers.59.mlp.experts.130.gate_proj", "model.layers.59.mlp.experts.131.gate_proj", "model.layers.59.mlp.experts.132.gate_proj", "model.layers.59.mlp.experts.133.gate_proj", "model.layers.59.mlp.experts.134.gate_proj", "model.layers.59.mlp.experts.135.gate_proj", "model.layers.59.mlp.experts.136.gate_proj", "model.layers.59.mlp.experts.137.gate_proj", "model.layers.59.mlp.experts.138.gate_proj", "model.layers.59.mlp.experts.139.gate_proj", "model.layers.59.mlp.experts.140.gate_proj", "model.layers.59.mlp.experts.141.gate_proj", "model.layers.59.mlp.experts.142.gate_proj", "model.layers.59.mlp.experts.143.gate_proj", "model.layers.59.mlp.experts.144.gate_proj", "model.layers.59.mlp.experts.145.gate_proj", "model.layers.59.mlp.experts.146.gate_proj", "model.layers.59.mlp.experts.147.gate_proj", "model.layers.59.mlp.experts.148.gate_proj", "model.layers.59.mlp.experts.149.gate_proj", "model.layers.59.mlp.experts.150.gate_proj", "model.layers.59.mlp.experts.151.gate_proj", "model.layers.59.mlp.experts.152.gate_proj", "model.layers.59.mlp.experts.153.gate_proj", "model.layers.59.mlp.experts.154.gate_proj", "model.layers.59.mlp.experts.155.gate_proj", "model.layers.59.mlp.experts.156.gate_proj", "model.layers.59.mlp.experts.157.gate_proj", "model.layers.59.mlp.experts.158.gate_proj", "model.layers.59.mlp.experts.159.gate_proj", "model.layers.59.mlp.experts.0.up_proj", "model.layers.59.mlp.experts.1.up_proj", "model.layers.59.mlp.experts.2.up_proj", "model.layers.59.mlp.experts.3.up_proj", "model.layers.59.mlp.experts.4.up_proj", "model.layers.59.mlp.experts.5.up_proj", "model.layers.59.mlp.experts.6.up_proj", "model.layers.59.mlp.experts.7.up_proj", "model.layers.59.mlp.experts.8.up_proj", "model.layers.59.mlp.experts.9.up_proj", "model.layers.59.mlp.experts.10.up_proj", "model.layers.59.mlp.experts.11.up_proj", "model.layers.59.mlp.experts.12.up_proj", "model.layers.59.mlp.experts.13.up_proj", "model.layers.59.mlp.experts.14.up_proj", "model.layers.59.mlp.experts.15.up_proj", "model.layers.59.mlp.experts.16.up_proj", "model.layers.59.mlp.experts.17.up_proj", "model.layers.59.mlp.experts.18.up_proj", "model.layers.59.mlp.experts.19.up_proj", "model.layers.59.mlp.experts.20.up_proj", "model.layers.59.mlp.experts.21.up_proj", "model.layers.59.mlp.experts.22.up_proj", "model.layers.59.mlp.experts.23.up_proj", "model.layers.59.mlp.experts.24.up_proj", "model.layers.59.mlp.experts.25.up_proj", "model.layers.59.mlp.experts.26.up_proj", "model.layers.59.mlp.experts.27.up_proj", "model.layers.59.mlp.experts.28.up_proj", "model.layers.59.mlp.experts.29.up_proj", "model.layers.59.mlp.experts.30.up_proj", "model.layers.59.mlp.experts.31.up_proj", "model.layers.59.mlp.experts.32.up_proj", "model.layers.59.mlp.experts.33.up_proj", "model.layers.59.mlp.experts.34.up_proj", "model.layers.59.mlp.experts.35.up_proj", "model.layers.59.mlp.experts.36.up_proj", "model.layers.59.mlp.experts.37.up_proj", "model.layers.59.mlp.experts.38.up_proj", "model.layers.59.mlp.experts.39.up_proj", "model.layers.59.mlp.experts.40.up_proj", "model.layers.59.mlp.experts.41.up_proj", "model.layers.59.mlp.experts.42.up_proj", "model.layers.59.mlp.experts.43.up_proj", "model.layers.59.mlp.experts.44.up_proj", "model.layers.59.mlp.experts.45.up_proj", "model.layers.59.mlp.experts.46.up_proj", "model.layers.59.mlp.experts.47.up_proj", "model.layers.59.mlp.experts.48.up_proj", "model.layers.59.mlp.experts.49.up_proj", "model.layers.59.mlp.experts.50.up_proj", "model.layers.59.mlp.experts.51.up_proj", "model.layers.59.mlp.experts.52.up_proj", "model.layers.59.mlp.experts.53.up_proj", "model.layers.59.mlp.experts.54.up_proj", "model.layers.59.mlp.experts.55.up_proj", "model.layers.59.mlp.experts.56.up_proj", "model.layers.59.mlp.experts.57.up_proj", "model.layers.59.mlp.experts.58.up_proj", "model.layers.59.mlp.experts.59.up_proj", "model.layers.59.mlp.experts.60.up_proj", "model.layers.59.mlp.experts.61.up_proj", "model.layers.59.mlp.experts.62.up_proj", "model.layers.59.mlp.experts.63.up_proj", "model.layers.59.mlp.experts.64.up_proj", "model.layers.59.mlp.experts.65.up_proj", "model.layers.59.mlp.experts.66.up_proj", "model.layers.59.mlp.experts.67.up_proj", "model.layers.59.mlp.experts.68.up_proj", "model.layers.59.mlp.experts.69.up_proj", "model.layers.59.mlp.experts.70.up_proj", "model.layers.59.mlp.experts.71.up_proj", "model.layers.59.mlp.experts.72.up_proj", "model.layers.59.mlp.experts.73.up_proj", "model.layers.59.mlp.experts.74.up_proj", "model.layers.59.mlp.experts.75.up_proj", "model.layers.59.mlp.experts.76.up_proj", "model.layers.59.mlp.experts.77.up_proj", "model.layers.59.mlp.experts.78.up_proj", "model.layers.59.mlp.experts.79.up_proj", "model.layers.59.mlp.experts.80.up_proj", "model.layers.59.mlp.experts.81.up_proj", "model.layers.59.mlp.experts.82.up_proj", "model.layers.59.mlp.experts.83.up_proj", "model.layers.59.mlp.experts.84.up_proj", "model.layers.59.mlp.experts.85.up_proj", "model.layers.59.mlp.experts.86.up_proj", "model.layers.59.mlp.experts.87.up_proj", "model.layers.59.mlp.experts.88.up_proj", "model.layers.59.mlp.experts.89.up_proj", "model.layers.59.mlp.experts.90.up_proj", "model.layers.59.mlp.experts.91.up_proj", "model.layers.59.mlp.experts.92.up_proj", "model.layers.59.mlp.experts.93.up_proj", "model.layers.59.mlp.experts.94.up_proj", "model.layers.59.mlp.experts.95.up_proj", "model.layers.59.mlp.experts.96.up_proj", "model.layers.59.mlp.experts.97.up_proj", "model.layers.59.mlp.experts.98.up_proj", "model.layers.59.mlp.experts.99.up_proj", "model.layers.59.mlp.experts.100.up_proj", "model.layers.59.mlp.experts.101.up_proj", "model.layers.59.mlp.experts.102.up_proj", "model.layers.59.mlp.experts.103.up_proj", "model.layers.59.mlp.experts.104.up_proj", "model.layers.59.mlp.experts.105.up_proj", "model.layers.59.mlp.experts.106.up_proj", "model.layers.59.mlp.experts.107.up_proj", "model.layers.59.mlp.experts.108.up_proj", "model.layers.59.mlp.experts.109.up_proj", "model.layers.59.mlp.experts.110.up_proj", "model.layers.59.mlp.experts.111.up_proj", "model.layers.59.mlp.experts.112.up_proj", "model.layers.59.mlp.experts.113.up_proj", "model.layers.59.mlp.experts.114.up_proj", "model.layers.59.mlp.experts.115.up_proj", "model.layers.59.mlp.experts.116.up_proj", "model.layers.59.mlp.experts.117.up_proj", "model.layers.59.mlp.experts.118.up_proj", "model.layers.59.mlp.experts.119.up_proj", "model.layers.59.mlp.experts.120.up_proj", "model.layers.59.mlp.experts.121.up_proj", "model.layers.59.mlp.experts.122.up_proj", "model.layers.59.mlp.experts.123.up_proj", "model.layers.59.mlp.experts.124.up_proj", "model.layers.59.mlp.experts.125.up_proj", "model.layers.59.mlp.experts.126.up_proj", "model.layers.59.mlp.experts.127.up_proj", "model.layers.59.mlp.experts.128.up_proj", "model.layers.59.mlp.experts.129.up_proj", "model.layers.59.mlp.experts.130.up_proj", "model.layers.59.mlp.experts.131.up_proj", "model.layers.59.mlp.experts.132.up_proj", "model.layers.59.mlp.experts.133.up_proj", "model.layers.59.mlp.experts.134.up_proj", "model.layers.59.mlp.experts.135.up_proj", "model.layers.59.mlp.experts.136.up_proj", "model.layers.59.mlp.experts.137.up_proj", "model.layers.59.mlp.experts.138.up_proj", "model.layers.59.mlp.experts.139.up_proj", "model.layers.59.mlp.experts.140.up_proj", "model.layers.59.mlp.experts.141.up_proj", "model.layers.59.mlp.experts.142.up_proj", "model.layers.59.mlp.experts.143.up_proj", "model.layers.59.mlp.experts.144.up_proj", "model.layers.59.mlp.experts.145.up_proj", "model.layers.59.mlp.experts.146.up_proj", "model.layers.59.mlp.experts.147.up_proj", "model.layers.59.mlp.experts.148.up_proj", "model.layers.59.mlp.experts.149.up_proj", "model.layers.59.mlp.experts.150.up_proj", "model.layers.59.mlp.experts.151.up_proj", "model.layers.59.mlp.experts.152.up_proj", "model.layers.59.mlp.experts.153.up_proj", "model.layers.59.mlp.experts.154.up_proj", "model.layers.59.mlp.experts.155.up_proj", "model.layers.59.mlp.experts.156.up_proj", "model.layers.59.mlp.experts.157.up_proj", "model.layers.59.mlp.experts.158.up_proj", "model.layers.59.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 2.0923139527440765e-05, "dbits": 2516582400 }, { "dkld": 1.5233014710248557e-05, "dbits": 5033164800 } ] }, { "idx": 356, "layers": [ "model.layers.59.mlp.experts.0.down_proj", "model.layers.59.mlp.experts.1.down_proj", "model.layers.59.mlp.experts.2.down_proj", "model.layers.59.mlp.experts.3.down_proj", "model.layers.59.mlp.experts.4.down_proj", "model.layers.59.mlp.experts.5.down_proj", "model.layers.59.mlp.experts.6.down_proj", "model.layers.59.mlp.experts.7.down_proj", "model.layers.59.mlp.experts.8.down_proj", "model.layers.59.mlp.experts.9.down_proj", "model.layers.59.mlp.experts.10.down_proj", "model.layers.59.mlp.experts.11.down_proj", "model.layers.59.mlp.experts.12.down_proj", "model.layers.59.mlp.experts.13.down_proj", "model.layers.59.mlp.experts.14.down_proj", "model.layers.59.mlp.experts.15.down_proj", "model.layers.59.mlp.experts.16.down_proj", "model.layers.59.mlp.experts.17.down_proj", "model.layers.59.mlp.experts.18.down_proj", "model.layers.59.mlp.experts.19.down_proj", "model.layers.59.mlp.experts.20.down_proj", "model.layers.59.mlp.experts.21.down_proj", "model.layers.59.mlp.experts.22.down_proj", "model.layers.59.mlp.experts.23.down_proj", "model.layers.59.mlp.experts.24.down_proj", "model.layers.59.mlp.experts.25.down_proj", "model.layers.59.mlp.experts.26.down_proj", "model.layers.59.mlp.experts.27.down_proj", "model.layers.59.mlp.experts.28.down_proj", "model.layers.59.mlp.experts.29.down_proj", "model.layers.59.mlp.experts.30.down_proj", "model.layers.59.mlp.experts.31.down_proj", "model.layers.59.mlp.experts.32.down_proj", "model.layers.59.mlp.experts.33.down_proj", "model.layers.59.mlp.experts.34.down_proj", "model.layers.59.mlp.experts.35.down_proj", "model.layers.59.mlp.experts.36.down_proj", "model.layers.59.mlp.experts.37.down_proj", "model.layers.59.mlp.experts.38.down_proj", "model.layers.59.mlp.experts.39.down_proj", "model.layers.59.mlp.experts.40.down_proj", "model.layers.59.mlp.experts.41.down_proj", "model.layers.59.mlp.experts.42.down_proj", "model.layers.59.mlp.experts.43.down_proj", "model.layers.59.mlp.experts.44.down_proj", "model.layers.59.mlp.experts.45.down_proj", "model.layers.59.mlp.experts.46.down_proj", "model.layers.59.mlp.experts.47.down_proj", "model.layers.59.mlp.experts.48.down_proj", "model.layers.59.mlp.experts.49.down_proj", "model.layers.59.mlp.experts.50.down_proj", "model.layers.59.mlp.experts.51.down_proj", "model.layers.59.mlp.experts.52.down_proj", "model.layers.59.mlp.experts.53.down_proj", "model.layers.59.mlp.experts.54.down_proj", "model.layers.59.mlp.experts.55.down_proj", "model.layers.59.mlp.experts.56.down_proj", "model.layers.59.mlp.experts.57.down_proj", "model.layers.59.mlp.experts.58.down_proj", "model.layers.59.mlp.experts.59.down_proj", "model.layers.59.mlp.experts.60.down_proj", "model.layers.59.mlp.experts.61.down_proj", "model.layers.59.mlp.experts.62.down_proj", "model.layers.59.mlp.experts.63.down_proj", "model.layers.59.mlp.experts.64.down_proj", "model.layers.59.mlp.experts.65.down_proj", "model.layers.59.mlp.experts.66.down_proj", "model.layers.59.mlp.experts.67.down_proj", "model.layers.59.mlp.experts.68.down_proj", "model.layers.59.mlp.experts.69.down_proj", "model.layers.59.mlp.experts.70.down_proj", "model.layers.59.mlp.experts.71.down_proj", "model.layers.59.mlp.experts.72.down_proj", "model.layers.59.mlp.experts.73.down_proj", "model.layers.59.mlp.experts.74.down_proj", "model.layers.59.mlp.experts.75.down_proj", "model.layers.59.mlp.experts.76.down_proj", "model.layers.59.mlp.experts.77.down_proj", "model.layers.59.mlp.experts.78.down_proj", "model.layers.59.mlp.experts.79.down_proj", "model.layers.59.mlp.experts.80.down_proj", "model.layers.59.mlp.experts.81.down_proj", "model.layers.59.mlp.experts.82.down_proj", "model.layers.59.mlp.experts.83.down_proj", "model.layers.59.mlp.experts.84.down_proj", "model.layers.59.mlp.experts.85.down_proj", "model.layers.59.mlp.experts.86.down_proj", "model.layers.59.mlp.experts.87.down_proj", "model.layers.59.mlp.experts.88.down_proj", "model.layers.59.mlp.experts.89.down_proj", "model.layers.59.mlp.experts.90.down_proj", "model.layers.59.mlp.experts.91.down_proj", "model.layers.59.mlp.experts.92.down_proj", "model.layers.59.mlp.experts.93.down_proj", "model.layers.59.mlp.experts.94.down_proj", "model.layers.59.mlp.experts.95.down_proj", "model.layers.59.mlp.experts.96.down_proj", "model.layers.59.mlp.experts.97.down_proj", "model.layers.59.mlp.experts.98.down_proj", "model.layers.59.mlp.experts.99.down_proj", "model.layers.59.mlp.experts.100.down_proj", "model.layers.59.mlp.experts.101.down_proj", "model.layers.59.mlp.experts.102.down_proj", "model.layers.59.mlp.experts.103.down_proj", "model.layers.59.mlp.experts.104.down_proj", "model.layers.59.mlp.experts.105.down_proj", "model.layers.59.mlp.experts.106.down_proj", "model.layers.59.mlp.experts.107.down_proj", "model.layers.59.mlp.experts.108.down_proj", "model.layers.59.mlp.experts.109.down_proj", "model.layers.59.mlp.experts.110.down_proj", "model.layers.59.mlp.experts.111.down_proj", "model.layers.59.mlp.experts.112.down_proj", "model.layers.59.mlp.experts.113.down_proj", "model.layers.59.mlp.experts.114.down_proj", "model.layers.59.mlp.experts.115.down_proj", "model.layers.59.mlp.experts.116.down_proj", "model.layers.59.mlp.experts.117.down_proj", "model.layers.59.mlp.experts.118.down_proj", "model.layers.59.mlp.experts.119.down_proj", "model.layers.59.mlp.experts.120.down_proj", "model.layers.59.mlp.experts.121.down_proj", "model.layers.59.mlp.experts.122.down_proj", "model.layers.59.mlp.experts.123.down_proj", "model.layers.59.mlp.experts.124.down_proj", "model.layers.59.mlp.experts.125.down_proj", "model.layers.59.mlp.experts.126.down_proj", "model.layers.59.mlp.experts.127.down_proj", "model.layers.59.mlp.experts.128.down_proj", "model.layers.59.mlp.experts.129.down_proj", "model.layers.59.mlp.experts.130.down_proj", "model.layers.59.mlp.experts.131.down_proj", "model.layers.59.mlp.experts.132.down_proj", "model.layers.59.mlp.experts.133.down_proj", "model.layers.59.mlp.experts.134.down_proj", "model.layers.59.mlp.experts.135.down_proj", "model.layers.59.mlp.experts.136.down_proj", "model.layers.59.mlp.experts.137.down_proj", "model.layers.59.mlp.experts.138.down_proj", "model.layers.59.mlp.experts.139.down_proj", "model.layers.59.mlp.experts.140.down_proj", "model.layers.59.mlp.experts.141.down_proj", "model.layers.59.mlp.experts.142.down_proj", "model.layers.59.mlp.experts.143.down_proj", "model.layers.59.mlp.experts.144.down_proj", "model.layers.59.mlp.experts.145.down_proj", "model.layers.59.mlp.experts.146.down_proj", "model.layers.59.mlp.experts.147.down_proj", "model.layers.59.mlp.experts.148.down_proj", "model.layers.59.mlp.experts.149.down_proj", "model.layers.59.mlp.experts.150.down_proj", "model.layers.59.mlp.experts.151.down_proj", "model.layers.59.mlp.experts.152.down_proj", "model.layers.59.mlp.experts.153.down_proj", "model.layers.59.mlp.experts.154.down_proj", "model.layers.59.mlp.experts.155.down_proj", "model.layers.59.mlp.experts.156.down_proj", "model.layers.59.mlp.experts.157.down_proj", "model.layers.59.mlp.experts.158.down_proj", "model.layers.59.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.1551403440534722e-05, "dbits": 1258291200 }, { "dkld": -7.769674994051456e-06, "dbits": 2516582400 } ] }, { "idx": 357, "layers": [ "model.layers.60.self_attn.q_proj" ], "candidates": [ { "dkld": -2.6557035744188828e-05, "dbits": 62914560 }, { "dkld": -2.0465301349758408e-05, "dbits": 125829120 } ] }, { "idx": 358, "layers": [ "model.layers.60.self_attn.k_proj", "model.layers.60.self_attn.v_proj" ], "candidates": [ { "dkld": -4.8152520321309566e-05, "dbits": 10485760 }, { "dkld": -8.331285789608955e-05, "dbits": 20971520 } ] }, { "idx": 359, "layers": [ "model.layers.60.self_attn.o_proj" ], "candidates": [ { "dkld": -5.208002403377446e-06, "dbits": 62914560 }, { "dkld": 2.0450190640987354e-05, "dbits": 125829120 } ] }, { "idx": 360, "layers": [ "model.layers.60.mlp.shared_experts.gate_proj", "model.layers.60.mlp.shared_experts.up_proj", "model.layers.60.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.222939558327094e-05, "dbits": 23592960 }, { "dkld": -3.76473879441612e-05, "dbits": 47185920 } ] }, { "idx": 361, "layers": [ "model.layers.60.mlp.experts.0.gate_proj", "model.layers.60.mlp.experts.1.gate_proj", "model.layers.60.mlp.experts.2.gate_proj", "model.layers.60.mlp.experts.3.gate_proj", "model.layers.60.mlp.experts.4.gate_proj", "model.layers.60.mlp.experts.5.gate_proj", "model.layers.60.mlp.experts.6.gate_proj", "model.layers.60.mlp.experts.7.gate_proj", "model.layers.60.mlp.experts.8.gate_proj", "model.layers.60.mlp.experts.9.gate_proj", "model.layers.60.mlp.experts.10.gate_proj", "model.layers.60.mlp.experts.11.gate_proj", "model.layers.60.mlp.experts.12.gate_proj", "model.layers.60.mlp.experts.13.gate_proj", "model.layers.60.mlp.experts.14.gate_proj", "model.layers.60.mlp.experts.15.gate_proj", "model.layers.60.mlp.experts.16.gate_proj", "model.layers.60.mlp.experts.17.gate_proj", "model.layers.60.mlp.experts.18.gate_proj", "model.layers.60.mlp.experts.19.gate_proj", "model.layers.60.mlp.experts.20.gate_proj", "model.layers.60.mlp.experts.21.gate_proj", "model.layers.60.mlp.experts.22.gate_proj", "model.layers.60.mlp.experts.23.gate_proj", "model.layers.60.mlp.experts.24.gate_proj", "model.layers.60.mlp.experts.25.gate_proj", "model.layers.60.mlp.experts.26.gate_proj", "model.layers.60.mlp.experts.27.gate_proj", "model.layers.60.mlp.experts.28.gate_proj", "model.layers.60.mlp.experts.29.gate_proj", "model.layers.60.mlp.experts.30.gate_proj", "model.layers.60.mlp.experts.31.gate_proj", "model.layers.60.mlp.experts.32.gate_proj", "model.layers.60.mlp.experts.33.gate_proj", "model.layers.60.mlp.experts.34.gate_proj", "model.layers.60.mlp.experts.35.gate_proj", "model.layers.60.mlp.experts.36.gate_proj", "model.layers.60.mlp.experts.37.gate_proj", "model.layers.60.mlp.experts.38.gate_proj", "model.layers.60.mlp.experts.39.gate_proj", "model.layers.60.mlp.experts.40.gate_proj", "model.layers.60.mlp.experts.41.gate_proj", "model.layers.60.mlp.experts.42.gate_proj", "model.layers.60.mlp.experts.43.gate_proj", "model.layers.60.mlp.experts.44.gate_proj", "model.layers.60.mlp.experts.45.gate_proj", "model.layers.60.mlp.experts.46.gate_proj", "model.layers.60.mlp.experts.47.gate_proj", "model.layers.60.mlp.experts.48.gate_proj", "model.layers.60.mlp.experts.49.gate_proj", "model.layers.60.mlp.experts.50.gate_proj", "model.layers.60.mlp.experts.51.gate_proj", "model.layers.60.mlp.experts.52.gate_proj", "model.layers.60.mlp.experts.53.gate_proj", "model.layers.60.mlp.experts.54.gate_proj", "model.layers.60.mlp.experts.55.gate_proj", "model.layers.60.mlp.experts.56.gate_proj", "model.layers.60.mlp.experts.57.gate_proj", "model.layers.60.mlp.experts.58.gate_proj", "model.layers.60.mlp.experts.59.gate_proj", "model.layers.60.mlp.experts.60.gate_proj", "model.layers.60.mlp.experts.61.gate_proj", "model.layers.60.mlp.experts.62.gate_proj", "model.layers.60.mlp.experts.63.gate_proj", "model.layers.60.mlp.experts.64.gate_proj", "model.layers.60.mlp.experts.65.gate_proj", "model.layers.60.mlp.experts.66.gate_proj", "model.layers.60.mlp.experts.67.gate_proj", "model.layers.60.mlp.experts.68.gate_proj", "model.layers.60.mlp.experts.69.gate_proj", "model.layers.60.mlp.experts.70.gate_proj", "model.layers.60.mlp.experts.71.gate_proj", "model.layers.60.mlp.experts.72.gate_proj", "model.layers.60.mlp.experts.73.gate_proj", "model.layers.60.mlp.experts.74.gate_proj", "model.layers.60.mlp.experts.75.gate_proj", "model.layers.60.mlp.experts.76.gate_proj", "model.layers.60.mlp.experts.77.gate_proj", "model.layers.60.mlp.experts.78.gate_proj", "model.layers.60.mlp.experts.79.gate_proj", "model.layers.60.mlp.experts.80.gate_proj", "model.layers.60.mlp.experts.81.gate_proj", "model.layers.60.mlp.experts.82.gate_proj", "model.layers.60.mlp.experts.83.gate_proj", "model.layers.60.mlp.experts.84.gate_proj", "model.layers.60.mlp.experts.85.gate_proj", "model.layers.60.mlp.experts.86.gate_proj", "model.layers.60.mlp.experts.87.gate_proj", "model.layers.60.mlp.experts.88.gate_proj", "model.layers.60.mlp.experts.89.gate_proj", "model.layers.60.mlp.experts.90.gate_proj", "model.layers.60.mlp.experts.91.gate_proj", "model.layers.60.mlp.experts.92.gate_proj", "model.layers.60.mlp.experts.93.gate_proj", "model.layers.60.mlp.experts.94.gate_proj", "model.layers.60.mlp.experts.95.gate_proj", "model.layers.60.mlp.experts.96.gate_proj", "model.layers.60.mlp.experts.97.gate_proj", "model.layers.60.mlp.experts.98.gate_proj", "model.layers.60.mlp.experts.99.gate_proj", "model.layers.60.mlp.experts.100.gate_proj", "model.layers.60.mlp.experts.101.gate_proj", "model.layers.60.mlp.experts.102.gate_proj", "model.layers.60.mlp.experts.103.gate_proj", "model.layers.60.mlp.experts.104.gate_proj", "model.layers.60.mlp.experts.105.gate_proj", "model.layers.60.mlp.experts.106.gate_proj", "model.layers.60.mlp.experts.107.gate_proj", "model.layers.60.mlp.experts.108.gate_proj", "model.layers.60.mlp.experts.109.gate_proj", "model.layers.60.mlp.experts.110.gate_proj", "model.layers.60.mlp.experts.111.gate_proj", "model.layers.60.mlp.experts.112.gate_proj", "model.layers.60.mlp.experts.113.gate_proj", "model.layers.60.mlp.experts.114.gate_proj", "model.layers.60.mlp.experts.115.gate_proj", "model.layers.60.mlp.experts.116.gate_proj", "model.layers.60.mlp.experts.117.gate_proj", "model.layers.60.mlp.experts.118.gate_proj", "model.layers.60.mlp.experts.119.gate_proj", "model.layers.60.mlp.experts.120.gate_proj", "model.layers.60.mlp.experts.121.gate_proj", "model.layers.60.mlp.experts.122.gate_proj", "model.layers.60.mlp.experts.123.gate_proj", "model.layers.60.mlp.experts.124.gate_proj", "model.layers.60.mlp.experts.125.gate_proj", "model.layers.60.mlp.experts.126.gate_proj", "model.layers.60.mlp.experts.127.gate_proj", "model.layers.60.mlp.experts.128.gate_proj", "model.layers.60.mlp.experts.129.gate_proj", "model.layers.60.mlp.experts.130.gate_proj", "model.layers.60.mlp.experts.131.gate_proj", "model.layers.60.mlp.experts.132.gate_proj", "model.layers.60.mlp.experts.133.gate_proj", "model.layers.60.mlp.experts.134.gate_proj", "model.layers.60.mlp.experts.135.gate_proj", "model.layers.60.mlp.experts.136.gate_proj", "model.layers.60.mlp.experts.137.gate_proj", "model.layers.60.mlp.experts.138.gate_proj", "model.layers.60.mlp.experts.139.gate_proj", "model.layers.60.mlp.experts.140.gate_proj", "model.layers.60.mlp.experts.141.gate_proj", "model.layers.60.mlp.experts.142.gate_proj", "model.layers.60.mlp.experts.143.gate_proj", "model.layers.60.mlp.experts.144.gate_proj", "model.layers.60.mlp.experts.145.gate_proj", "model.layers.60.mlp.experts.146.gate_proj", "model.layers.60.mlp.experts.147.gate_proj", "model.layers.60.mlp.experts.148.gate_proj", "model.layers.60.mlp.experts.149.gate_proj", "model.layers.60.mlp.experts.150.gate_proj", "model.layers.60.mlp.experts.151.gate_proj", "model.layers.60.mlp.experts.152.gate_proj", "model.layers.60.mlp.experts.153.gate_proj", "model.layers.60.mlp.experts.154.gate_proj", "model.layers.60.mlp.experts.155.gate_proj", "model.layers.60.mlp.experts.156.gate_proj", "model.layers.60.mlp.experts.157.gate_proj", "model.layers.60.mlp.experts.158.gate_proj", "model.layers.60.mlp.experts.159.gate_proj", "model.layers.60.mlp.experts.0.up_proj", "model.layers.60.mlp.experts.1.up_proj", "model.layers.60.mlp.experts.2.up_proj", "model.layers.60.mlp.experts.3.up_proj", "model.layers.60.mlp.experts.4.up_proj", "model.layers.60.mlp.experts.5.up_proj", "model.layers.60.mlp.experts.6.up_proj", "model.layers.60.mlp.experts.7.up_proj", "model.layers.60.mlp.experts.8.up_proj", "model.layers.60.mlp.experts.9.up_proj", "model.layers.60.mlp.experts.10.up_proj", "model.layers.60.mlp.experts.11.up_proj", "model.layers.60.mlp.experts.12.up_proj", "model.layers.60.mlp.experts.13.up_proj", "model.layers.60.mlp.experts.14.up_proj", "model.layers.60.mlp.experts.15.up_proj", "model.layers.60.mlp.experts.16.up_proj", "model.layers.60.mlp.experts.17.up_proj", "model.layers.60.mlp.experts.18.up_proj", "model.layers.60.mlp.experts.19.up_proj", "model.layers.60.mlp.experts.20.up_proj", "model.layers.60.mlp.experts.21.up_proj", "model.layers.60.mlp.experts.22.up_proj", "model.layers.60.mlp.experts.23.up_proj", "model.layers.60.mlp.experts.24.up_proj", "model.layers.60.mlp.experts.25.up_proj", "model.layers.60.mlp.experts.26.up_proj", "model.layers.60.mlp.experts.27.up_proj", "model.layers.60.mlp.experts.28.up_proj", "model.layers.60.mlp.experts.29.up_proj", "model.layers.60.mlp.experts.30.up_proj", "model.layers.60.mlp.experts.31.up_proj", "model.layers.60.mlp.experts.32.up_proj", "model.layers.60.mlp.experts.33.up_proj", "model.layers.60.mlp.experts.34.up_proj", "model.layers.60.mlp.experts.35.up_proj", "model.layers.60.mlp.experts.36.up_proj", "model.layers.60.mlp.experts.37.up_proj", "model.layers.60.mlp.experts.38.up_proj", "model.layers.60.mlp.experts.39.up_proj", "model.layers.60.mlp.experts.40.up_proj", "model.layers.60.mlp.experts.41.up_proj", "model.layers.60.mlp.experts.42.up_proj", "model.layers.60.mlp.experts.43.up_proj", "model.layers.60.mlp.experts.44.up_proj", "model.layers.60.mlp.experts.45.up_proj", "model.layers.60.mlp.experts.46.up_proj", "model.layers.60.mlp.experts.47.up_proj", "model.layers.60.mlp.experts.48.up_proj", "model.layers.60.mlp.experts.49.up_proj", "model.layers.60.mlp.experts.50.up_proj", "model.layers.60.mlp.experts.51.up_proj", "model.layers.60.mlp.experts.52.up_proj", "model.layers.60.mlp.experts.53.up_proj", "model.layers.60.mlp.experts.54.up_proj", "model.layers.60.mlp.experts.55.up_proj", "model.layers.60.mlp.experts.56.up_proj", "model.layers.60.mlp.experts.57.up_proj", "model.layers.60.mlp.experts.58.up_proj", "model.layers.60.mlp.experts.59.up_proj", "model.layers.60.mlp.experts.60.up_proj", "model.layers.60.mlp.experts.61.up_proj", "model.layers.60.mlp.experts.62.up_proj", "model.layers.60.mlp.experts.63.up_proj", "model.layers.60.mlp.experts.64.up_proj", "model.layers.60.mlp.experts.65.up_proj", "model.layers.60.mlp.experts.66.up_proj", "model.layers.60.mlp.experts.67.up_proj", "model.layers.60.mlp.experts.68.up_proj", "model.layers.60.mlp.experts.69.up_proj", "model.layers.60.mlp.experts.70.up_proj", "model.layers.60.mlp.experts.71.up_proj", "model.layers.60.mlp.experts.72.up_proj", "model.layers.60.mlp.experts.73.up_proj", "model.layers.60.mlp.experts.74.up_proj", "model.layers.60.mlp.experts.75.up_proj", "model.layers.60.mlp.experts.76.up_proj", "model.layers.60.mlp.experts.77.up_proj", "model.layers.60.mlp.experts.78.up_proj", "model.layers.60.mlp.experts.79.up_proj", "model.layers.60.mlp.experts.80.up_proj", "model.layers.60.mlp.experts.81.up_proj", "model.layers.60.mlp.experts.82.up_proj", "model.layers.60.mlp.experts.83.up_proj", "model.layers.60.mlp.experts.84.up_proj", "model.layers.60.mlp.experts.85.up_proj", "model.layers.60.mlp.experts.86.up_proj", "model.layers.60.mlp.experts.87.up_proj", "model.layers.60.mlp.experts.88.up_proj", "model.layers.60.mlp.experts.89.up_proj", "model.layers.60.mlp.experts.90.up_proj", "model.layers.60.mlp.experts.91.up_proj", "model.layers.60.mlp.experts.92.up_proj", "model.layers.60.mlp.experts.93.up_proj", "model.layers.60.mlp.experts.94.up_proj", "model.layers.60.mlp.experts.95.up_proj", "model.layers.60.mlp.experts.96.up_proj", "model.layers.60.mlp.experts.97.up_proj", "model.layers.60.mlp.experts.98.up_proj", "model.layers.60.mlp.experts.99.up_proj", "model.layers.60.mlp.experts.100.up_proj", "model.layers.60.mlp.experts.101.up_proj", "model.layers.60.mlp.experts.102.up_proj", "model.layers.60.mlp.experts.103.up_proj", "model.layers.60.mlp.experts.104.up_proj", "model.layers.60.mlp.experts.105.up_proj", "model.layers.60.mlp.experts.106.up_proj", "model.layers.60.mlp.experts.107.up_proj", "model.layers.60.mlp.experts.108.up_proj", "model.layers.60.mlp.experts.109.up_proj", "model.layers.60.mlp.experts.110.up_proj", "model.layers.60.mlp.experts.111.up_proj", "model.layers.60.mlp.experts.112.up_proj", "model.layers.60.mlp.experts.113.up_proj", "model.layers.60.mlp.experts.114.up_proj", "model.layers.60.mlp.experts.115.up_proj", "model.layers.60.mlp.experts.116.up_proj", "model.layers.60.mlp.experts.117.up_proj", "model.layers.60.mlp.experts.118.up_proj", "model.layers.60.mlp.experts.119.up_proj", "model.layers.60.mlp.experts.120.up_proj", "model.layers.60.mlp.experts.121.up_proj", "model.layers.60.mlp.experts.122.up_proj", "model.layers.60.mlp.experts.123.up_proj", "model.layers.60.mlp.experts.124.up_proj", "model.layers.60.mlp.experts.125.up_proj", "model.layers.60.mlp.experts.126.up_proj", "model.layers.60.mlp.experts.127.up_proj", "model.layers.60.mlp.experts.128.up_proj", "model.layers.60.mlp.experts.129.up_proj", "model.layers.60.mlp.experts.130.up_proj", "model.layers.60.mlp.experts.131.up_proj", "model.layers.60.mlp.experts.132.up_proj", "model.layers.60.mlp.experts.133.up_proj", "model.layers.60.mlp.experts.134.up_proj", "model.layers.60.mlp.experts.135.up_proj", "model.layers.60.mlp.experts.136.up_proj", "model.layers.60.mlp.experts.137.up_proj", "model.layers.60.mlp.experts.138.up_proj", "model.layers.60.mlp.experts.139.up_proj", "model.layers.60.mlp.experts.140.up_proj", "model.layers.60.mlp.experts.141.up_proj", "model.layers.60.mlp.experts.142.up_proj", "model.layers.60.mlp.experts.143.up_proj", "model.layers.60.mlp.experts.144.up_proj", "model.layers.60.mlp.experts.145.up_proj", "model.layers.60.mlp.experts.146.up_proj", "model.layers.60.mlp.experts.147.up_proj", "model.layers.60.mlp.experts.148.up_proj", "model.layers.60.mlp.experts.149.up_proj", "model.layers.60.mlp.experts.150.up_proj", "model.layers.60.mlp.experts.151.up_proj", "model.layers.60.mlp.experts.152.up_proj", "model.layers.60.mlp.experts.153.up_proj", "model.layers.60.mlp.experts.154.up_proj", "model.layers.60.mlp.experts.155.up_proj", "model.layers.60.mlp.experts.156.up_proj", "model.layers.60.mlp.experts.157.up_proj", "model.layers.60.mlp.experts.158.up_proj", "model.layers.60.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 6.31110742688179e-06, "dbits": 2516582400 }, { "dkld": -2.0711449906229973e-06, "dbits": 5033164800 } ] }, { "idx": 362, "layers": [ "model.layers.60.mlp.experts.0.down_proj", "model.layers.60.mlp.experts.1.down_proj", "model.layers.60.mlp.experts.2.down_proj", "model.layers.60.mlp.experts.3.down_proj", "model.layers.60.mlp.experts.4.down_proj", "model.layers.60.mlp.experts.5.down_proj", "model.layers.60.mlp.experts.6.down_proj", "model.layers.60.mlp.experts.7.down_proj", "model.layers.60.mlp.experts.8.down_proj", "model.layers.60.mlp.experts.9.down_proj", "model.layers.60.mlp.experts.10.down_proj", "model.layers.60.mlp.experts.11.down_proj", "model.layers.60.mlp.experts.12.down_proj", "model.layers.60.mlp.experts.13.down_proj", "model.layers.60.mlp.experts.14.down_proj", "model.layers.60.mlp.experts.15.down_proj", "model.layers.60.mlp.experts.16.down_proj", "model.layers.60.mlp.experts.17.down_proj", "model.layers.60.mlp.experts.18.down_proj", "model.layers.60.mlp.experts.19.down_proj", "model.layers.60.mlp.experts.20.down_proj", "model.layers.60.mlp.experts.21.down_proj", "model.layers.60.mlp.experts.22.down_proj", "model.layers.60.mlp.experts.23.down_proj", "model.layers.60.mlp.experts.24.down_proj", "model.layers.60.mlp.experts.25.down_proj", "model.layers.60.mlp.experts.26.down_proj", "model.layers.60.mlp.experts.27.down_proj", "model.layers.60.mlp.experts.28.down_proj", "model.layers.60.mlp.experts.29.down_proj", "model.layers.60.mlp.experts.30.down_proj", "model.layers.60.mlp.experts.31.down_proj", "model.layers.60.mlp.experts.32.down_proj", "model.layers.60.mlp.experts.33.down_proj", "model.layers.60.mlp.experts.34.down_proj", "model.layers.60.mlp.experts.35.down_proj", "model.layers.60.mlp.experts.36.down_proj", "model.layers.60.mlp.experts.37.down_proj", "model.layers.60.mlp.experts.38.down_proj", "model.layers.60.mlp.experts.39.down_proj", "model.layers.60.mlp.experts.40.down_proj", "model.layers.60.mlp.experts.41.down_proj", "model.layers.60.mlp.experts.42.down_proj", "model.layers.60.mlp.experts.43.down_proj", "model.layers.60.mlp.experts.44.down_proj", "model.layers.60.mlp.experts.45.down_proj", "model.layers.60.mlp.experts.46.down_proj", "model.layers.60.mlp.experts.47.down_proj", "model.layers.60.mlp.experts.48.down_proj", "model.layers.60.mlp.experts.49.down_proj", "model.layers.60.mlp.experts.50.down_proj", "model.layers.60.mlp.experts.51.down_proj", "model.layers.60.mlp.experts.52.down_proj", "model.layers.60.mlp.experts.53.down_proj", "model.layers.60.mlp.experts.54.down_proj", "model.layers.60.mlp.experts.55.down_proj", "model.layers.60.mlp.experts.56.down_proj", "model.layers.60.mlp.experts.57.down_proj", "model.layers.60.mlp.experts.58.down_proj", "model.layers.60.mlp.experts.59.down_proj", "model.layers.60.mlp.experts.60.down_proj", "model.layers.60.mlp.experts.61.down_proj", "model.layers.60.mlp.experts.62.down_proj", "model.layers.60.mlp.experts.63.down_proj", "model.layers.60.mlp.experts.64.down_proj", "model.layers.60.mlp.experts.65.down_proj", "model.layers.60.mlp.experts.66.down_proj", "model.layers.60.mlp.experts.67.down_proj", "model.layers.60.mlp.experts.68.down_proj", "model.layers.60.mlp.experts.69.down_proj", "model.layers.60.mlp.experts.70.down_proj", "model.layers.60.mlp.experts.71.down_proj", "model.layers.60.mlp.experts.72.down_proj", "model.layers.60.mlp.experts.73.down_proj", "model.layers.60.mlp.experts.74.down_proj", "model.layers.60.mlp.experts.75.down_proj", "model.layers.60.mlp.experts.76.down_proj", "model.layers.60.mlp.experts.77.down_proj", "model.layers.60.mlp.experts.78.down_proj", "model.layers.60.mlp.experts.79.down_proj", "model.layers.60.mlp.experts.80.down_proj", "model.layers.60.mlp.experts.81.down_proj", "model.layers.60.mlp.experts.82.down_proj", "model.layers.60.mlp.experts.83.down_proj", "model.layers.60.mlp.experts.84.down_proj", "model.layers.60.mlp.experts.85.down_proj", "model.layers.60.mlp.experts.86.down_proj", "model.layers.60.mlp.experts.87.down_proj", "model.layers.60.mlp.experts.88.down_proj", "model.layers.60.mlp.experts.89.down_proj", "model.layers.60.mlp.experts.90.down_proj", "model.layers.60.mlp.experts.91.down_proj", "model.layers.60.mlp.experts.92.down_proj", "model.layers.60.mlp.experts.93.down_proj", "model.layers.60.mlp.experts.94.down_proj", "model.layers.60.mlp.experts.95.down_proj", "model.layers.60.mlp.experts.96.down_proj", "model.layers.60.mlp.experts.97.down_proj", "model.layers.60.mlp.experts.98.down_proj", "model.layers.60.mlp.experts.99.down_proj", "model.layers.60.mlp.experts.100.down_proj", "model.layers.60.mlp.experts.101.down_proj", "model.layers.60.mlp.experts.102.down_proj", "model.layers.60.mlp.experts.103.down_proj", "model.layers.60.mlp.experts.104.down_proj", "model.layers.60.mlp.experts.105.down_proj", "model.layers.60.mlp.experts.106.down_proj", "model.layers.60.mlp.experts.107.down_proj", "model.layers.60.mlp.experts.108.down_proj", "model.layers.60.mlp.experts.109.down_proj", "model.layers.60.mlp.experts.110.down_proj", "model.layers.60.mlp.experts.111.down_proj", "model.layers.60.mlp.experts.112.down_proj", "model.layers.60.mlp.experts.113.down_proj", "model.layers.60.mlp.experts.114.down_proj", "model.layers.60.mlp.experts.115.down_proj", "model.layers.60.mlp.experts.116.down_proj", "model.layers.60.mlp.experts.117.down_proj", "model.layers.60.mlp.experts.118.down_proj", "model.layers.60.mlp.experts.119.down_proj", "model.layers.60.mlp.experts.120.down_proj", "model.layers.60.mlp.experts.121.down_proj", "model.layers.60.mlp.experts.122.down_proj", "model.layers.60.mlp.experts.123.down_proj", "model.layers.60.mlp.experts.124.down_proj", "model.layers.60.mlp.experts.125.down_proj", "model.layers.60.mlp.experts.126.down_proj", "model.layers.60.mlp.experts.127.down_proj", "model.layers.60.mlp.experts.128.down_proj", "model.layers.60.mlp.experts.129.down_proj", "model.layers.60.mlp.experts.130.down_proj", "model.layers.60.mlp.experts.131.down_proj", "model.layers.60.mlp.experts.132.down_proj", "model.layers.60.mlp.experts.133.down_proj", "model.layers.60.mlp.experts.134.down_proj", "model.layers.60.mlp.experts.135.down_proj", "model.layers.60.mlp.experts.136.down_proj", "model.layers.60.mlp.experts.137.down_proj", "model.layers.60.mlp.experts.138.down_proj", "model.layers.60.mlp.experts.139.down_proj", "model.layers.60.mlp.experts.140.down_proj", "model.layers.60.mlp.experts.141.down_proj", "model.layers.60.mlp.experts.142.down_proj", "model.layers.60.mlp.experts.143.down_proj", "model.layers.60.mlp.experts.144.down_proj", "model.layers.60.mlp.experts.145.down_proj", "model.layers.60.mlp.experts.146.down_proj", "model.layers.60.mlp.experts.147.down_proj", "model.layers.60.mlp.experts.148.down_proj", "model.layers.60.mlp.experts.149.down_proj", "model.layers.60.mlp.experts.150.down_proj", "model.layers.60.mlp.experts.151.down_proj", "model.layers.60.mlp.experts.152.down_proj", "model.layers.60.mlp.experts.153.down_proj", "model.layers.60.mlp.experts.154.down_proj", "model.layers.60.mlp.experts.155.down_proj", "model.layers.60.mlp.experts.156.down_proj", "model.layers.60.mlp.experts.157.down_proj", "model.layers.60.mlp.experts.158.down_proj", "model.layers.60.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.1936551891265912e-05, "dbits": 1258291200 }, { "dkld": -1.4560064300894737e-06, "dbits": 2516582400 } ] }, { "idx": 363, "layers": [ "model.layers.61.self_attn.q_proj" ], "candidates": [ { "dkld": 1.8721912056207657e-05, "dbits": 62914560 }, { "dkld": 2.2581778466701508e-05, "dbits": 125829120 } ] }, { "idx": 364, "layers": [ "model.layers.61.self_attn.k_proj", "model.layers.61.self_attn.v_proj" ], "candidates": [ { "dkld": -3.888458013533852e-06, "dbits": 10485760 }, { "dkld": -2.7801841497414326e-06, "dbits": 20971520 } ] }, { "idx": 365, "layers": [ "model.layers.61.self_attn.o_proj" ], "candidates": [ { "dkld": -1.0541593655943177e-05, "dbits": 62914560 }, { "dkld": -1.528111752122606e-05, "dbits": 125829120 } ] }, { "idx": 366, "layers": [ "model.layers.61.mlp.shared_experts.gate_proj", "model.layers.61.mlp.shared_experts.up_proj", "model.layers.61.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.855660229921341e-05, "dbits": 23592960 }, { "dkld": -1.004035584628582e-05, "dbits": 47185920 } ] }, { "idx": 367, "layers": [ "model.layers.61.mlp.experts.0.gate_proj", "model.layers.61.mlp.experts.1.gate_proj", "model.layers.61.mlp.experts.2.gate_proj", "model.layers.61.mlp.experts.3.gate_proj", "model.layers.61.mlp.experts.4.gate_proj", "model.layers.61.mlp.experts.5.gate_proj", "model.layers.61.mlp.experts.6.gate_proj", "model.layers.61.mlp.experts.7.gate_proj", "model.layers.61.mlp.experts.8.gate_proj", "model.layers.61.mlp.experts.9.gate_proj", "model.layers.61.mlp.experts.10.gate_proj", "model.layers.61.mlp.experts.11.gate_proj", "model.layers.61.mlp.experts.12.gate_proj", "model.layers.61.mlp.experts.13.gate_proj", "model.layers.61.mlp.experts.14.gate_proj", "model.layers.61.mlp.experts.15.gate_proj", "model.layers.61.mlp.experts.16.gate_proj", "model.layers.61.mlp.experts.17.gate_proj", "model.layers.61.mlp.experts.18.gate_proj", "model.layers.61.mlp.experts.19.gate_proj", "model.layers.61.mlp.experts.20.gate_proj", "model.layers.61.mlp.experts.21.gate_proj", "model.layers.61.mlp.experts.22.gate_proj", "model.layers.61.mlp.experts.23.gate_proj", "model.layers.61.mlp.experts.24.gate_proj", "model.layers.61.mlp.experts.25.gate_proj", "model.layers.61.mlp.experts.26.gate_proj", "model.layers.61.mlp.experts.27.gate_proj", "model.layers.61.mlp.experts.28.gate_proj", "model.layers.61.mlp.experts.29.gate_proj", "model.layers.61.mlp.experts.30.gate_proj", "model.layers.61.mlp.experts.31.gate_proj", "model.layers.61.mlp.experts.32.gate_proj", "model.layers.61.mlp.experts.33.gate_proj", "model.layers.61.mlp.experts.34.gate_proj", "model.layers.61.mlp.experts.35.gate_proj", "model.layers.61.mlp.experts.36.gate_proj", "model.layers.61.mlp.experts.37.gate_proj", "model.layers.61.mlp.experts.38.gate_proj", "model.layers.61.mlp.experts.39.gate_proj", "model.layers.61.mlp.experts.40.gate_proj", "model.layers.61.mlp.experts.41.gate_proj", "model.layers.61.mlp.experts.42.gate_proj", "model.layers.61.mlp.experts.43.gate_proj", "model.layers.61.mlp.experts.44.gate_proj", "model.layers.61.mlp.experts.45.gate_proj", "model.layers.61.mlp.experts.46.gate_proj", "model.layers.61.mlp.experts.47.gate_proj", "model.layers.61.mlp.experts.48.gate_proj", "model.layers.61.mlp.experts.49.gate_proj", "model.layers.61.mlp.experts.50.gate_proj", "model.layers.61.mlp.experts.51.gate_proj", "model.layers.61.mlp.experts.52.gate_proj", "model.layers.61.mlp.experts.53.gate_proj", "model.layers.61.mlp.experts.54.gate_proj", "model.layers.61.mlp.experts.55.gate_proj", "model.layers.61.mlp.experts.56.gate_proj", "model.layers.61.mlp.experts.57.gate_proj", "model.layers.61.mlp.experts.58.gate_proj", "model.layers.61.mlp.experts.59.gate_proj", "model.layers.61.mlp.experts.60.gate_proj", "model.layers.61.mlp.experts.61.gate_proj", "model.layers.61.mlp.experts.62.gate_proj", "model.layers.61.mlp.experts.63.gate_proj", "model.layers.61.mlp.experts.64.gate_proj", "model.layers.61.mlp.experts.65.gate_proj", "model.layers.61.mlp.experts.66.gate_proj", "model.layers.61.mlp.experts.67.gate_proj", "model.layers.61.mlp.experts.68.gate_proj", "model.layers.61.mlp.experts.69.gate_proj", "model.layers.61.mlp.experts.70.gate_proj", "model.layers.61.mlp.experts.71.gate_proj", "model.layers.61.mlp.experts.72.gate_proj", "model.layers.61.mlp.experts.73.gate_proj", "model.layers.61.mlp.experts.74.gate_proj", "model.layers.61.mlp.experts.75.gate_proj", "model.layers.61.mlp.experts.76.gate_proj", "model.layers.61.mlp.experts.77.gate_proj", "model.layers.61.mlp.experts.78.gate_proj", "model.layers.61.mlp.experts.79.gate_proj", "model.layers.61.mlp.experts.80.gate_proj", "model.layers.61.mlp.experts.81.gate_proj", "model.layers.61.mlp.experts.82.gate_proj", "model.layers.61.mlp.experts.83.gate_proj", "model.layers.61.mlp.experts.84.gate_proj", "model.layers.61.mlp.experts.85.gate_proj", "model.layers.61.mlp.experts.86.gate_proj", "model.layers.61.mlp.experts.87.gate_proj", "model.layers.61.mlp.experts.88.gate_proj", "model.layers.61.mlp.experts.89.gate_proj", "model.layers.61.mlp.experts.90.gate_proj", "model.layers.61.mlp.experts.91.gate_proj", "model.layers.61.mlp.experts.92.gate_proj", "model.layers.61.mlp.experts.93.gate_proj", "model.layers.61.mlp.experts.94.gate_proj", "model.layers.61.mlp.experts.95.gate_proj", "model.layers.61.mlp.experts.96.gate_proj", "model.layers.61.mlp.experts.97.gate_proj", "model.layers.61.mlp.experts.98.gate_proj", "model.layers.61.mlp.experts.99.gate_proj", "model.layers.61.mlp.experts.100.gate_proj", "model.layers.61.mlp.experts.101.gate_proj", "model.layers.61.mlp.experts.102.gate_proj", "model.layers.61.mlp.experts.103.gate_proj", "model.layers.61.mlp.experts.104.gate_proj", "model.layers.61.mlp.experts.105.gate_proj", "model.layers.61.mlp.experts.106.gate_proj", "model.layers.61.mlp.experts.107.gate_proj", "model.layers.61.mlp.experts.108.gate_proj", "model.layers.61.mlp.experts.109.gate_proj", "model.layers.61.mlp.experts.110.gate_proj", "model.layers.61.mlp.experts.111.gate_proj", "model.layers.61.mlp.experts.112.gate_proj", "model.layers.61.mlp.experts.113.gate_proj", "model.layers.61.mlp.experts.114.gate_proj", "model.layers.61.mlp.experts.115.gate_proj", "model.layers.61.mlp.experts.116.gate_proj", "model.layers.61.mlp.experts.117.gate_proj", "model.layers.61.mlp.experts.118.gate_proj", "model.layers.61.mlp.experts.119.gate_proj", "model.layers.61.mlp.experts.120.gate_proj", "model.layers.61.mlp.experts.121.gate_proj", "model.layers.61.mlp.experts.122.gate_proj", "model.layers.61.mlp.experts.123.gate_proj", "model.layers.61.mlp.experts.124.gate_proj", "model.layers.61.mlp.experts.125.gate_proj", "model.layers.61.mlp.experts.126.gate_proj", "model.layers.61.mlp.experts.127.gate_proj", "model.layers.61.mlp.experts.128.gate_proj", "model.layers.61.mlp.experts.129.gate_proj", "model.layers.61.mlp.experts.130.gate_proj", "model.layers.61.mlp.experts.131.gate_proj", "model.layers.61.mlp.experts.132.gate_proj", "model.layers.61.mlp.experts.133.gate_proj", "model.layers.61.mlp.experts.134.gate_proj", "model.layers.61.mlp.experts.135.gate_proj", "model.layers.61.mlp.experts.136.gate_proj", "model.layers.61.mlp.experts.137.gate_proj", "model.layers.61.mlp.experts.138.gate_proj", "model.layers.61.mlp.experts.139.gate_proj", "model.layers.61.mlp.experts.140.gate_proj", "model.layers.61.mlp.experts.141.gate_proj", "model.layers.61.mlp.experts.142.gate_proj", "model.layers.61.mlp.experts.143.gate_proj", "model.layers.61.mlp.experts.144.gate_proj", "model.layers.61.mlp.experts.145.gate_proj", "model.layers.61.mlp.experts.146.gate_proj", "model.layers.61.mlp.experts.147.gate_proj", "model.layers.61.mlp.experts.148.gate_proj", "model.layers.61.mlp.experts.149.gate_proj", "model.layers.61.mlp.experts.150.gate_proj", "model.layers.61.mlp.experts.151.gate_proj", "model.layers.61.mlp.experts.152.gate_proj", "model.layers.61.mlp.experts.153.gate_proj", "model.layers.61.mlp.experts.154.gate_proj", "model.layers.61.mlp.experts.155.gate_proj", "model.layers.61.mlp.experts.156.gate_proj", "model.layers.61.mlp.experts.157.gate_proj", "model.layers.61.mlp.experts.158.gate_proj", "model.layers.61.mlp.experts.159.gate_proj", "model.layers.61.mlp.experts.0.up_proj", "model.layers.61.mlp.experts.1.up_proj", "model.layers.61.mlp.experts.2.up_proj", "model.layers.61.mlp.experts.3.up_proj", "model.layers.61.mlp.experts.4.up_proj", "model.layers.61.mlp.experts.5.up_proj", "model.layers.61.mlp.experts.6.up_proj", "model.layers.61.mlp.experts.7.up_proj", "model.layers.61.mlp.experts.8.up_proj", "model.layers.61.mlp.experts.9.up_proj", "model.layers.61.mlp.experts.10.up_proj", "model.layers.61.mlp.experts.11.up_proj", "model.layers.61.mlp.experts.12.up_proj", "model.layers.61.mlp.experts.13.up_proj", "model.layers.61.mlp.experts.14.up_proj", "model.layers.61.mlp.experts.15.up_proj", "model.layers.61.mlp.experts.16.up_proj", "model.layers.61.mlp.experts.17.up_proj", "model.layers.61.mlp.experts.18.up_proj", "model.layers.61.mlp.experts.19.up_proj", "model.layers.61.mlp.experts.20.up_proj", "model.layers.61.mlp.experts.21.up_proj", "model.layers.61.mlp.experts.22.up_proj", "model.layers.61.mlp.experts.23.up_proj", "model.layers.61.mlp.experts.24.up_proj", "model.layers.61.mlp.experts.25.up_proj", "model.layers.61.mlp.experts.26.up_proj", "model.layers.61.mlp.experts.27.up_proj", "model.layers.61.mlp.experts.28.up_proj", "model.layers.61.mlp.experts.29.up_proj", "model.layers.61.mlp.experts.30.up_proj", "model.layers.61.mlp.experts.31.up_proj", "model.layers.61.mlp.experts.32.up_proj", "model.layers.61.mlp.experts.33.up_proj", "model.layers.61.mlp.experts.34.up_proj", "model.layers.61.mlp.experts.35.up_proj", "model.layers.61.mlp.experts.36.up_proj", "model.layers.61.mlp.experts.37.up_proj", "model.layers.61.mlp.experts.38.up_proj", "model.layers.61.mlp.experts.39.up_proj", "model.layers.61.mlp.experts.40.up_proj", "model.layers.61.mlp.experts.41.up_proj", "model.layers.61.mlp.experts.42.up_proj", "model.layers.61.mlp.experts.43.up_proj", "model.layers.61.mlp.experts.44.up_proj", "model.layers.61.mlp.experts.45.up_proj", "model.layers.61.mlp.experts.46.up_proj", "model.layers.61.mlp.experts.47.up_proj", "model.layers.61.mlp.experts.48.up_proj", "model.layers.61.mlp.experts.49.up_proj", "model.layers.61.mlp.experts.50.up_proj", "model.layers.61.mlp.experts.51.up_proj", "model.layers.61.mlp.experts.52.up_proj", "model.layers.61.mlp.experts.53.up_proj", "model.layers.61.mlp.experts.54.up_proj", "model.layers.61.mlp.experts.55.up_proj", "model.layers.61.mlp.experts.56.up_proj", "model.layers.61.mlp.experts.57.up_proj", "model.layers.61.mlp.experts.58.up_proj", "model.layers.61.mlp.experts.59.up_proj", "model.layers.61.mlp.experts.60.up_proj", "model.layers.61.mlp.experts.61.up_proj", "model.layers.61.mlp.experts.62.up_proj", "model.layers.61.mlp.experts.63.up_proj", "model.layers.61.mlp.experts.64.up_proj", "model.layers.61.mlp.experts.65.up_proj", "model.layers.61.mlp.experts.66.up_proj", "model.layers.61.mlp.experts.67.up_proj", "model.layers.61.mlp.experts.68.up_proj", "model.layers.61.mlp.experts.69.up_proj", "model.layers.61.mlp.experts.70.up_proj", "model.layers.61.mlp.experts.71.up_proj", "model.layers.61.mlp.experts.72.up_proj", "model.layers.61.mlp.experts.73.up_proj", "model.layers.61.mlp.experts.74.up_proj", "model.layers.61.mlp.experts.75.up_proj", "model.layers.61.mlp.experts.76.up_proj", "model.layers.61.mlp.experts.77.up_proj", "model.layers.61.mlp.experts.78.up_proj", "model.layers.61.mlp.experts.79.up_proj", "model.layers.61.mlp.experts.80.up_proj", "model.layers.61.mlp.experts.81.up_proj", "model.layers.61.mlp.experts.82.up_proj", "model.layers.61.mlp.experts.83.up_proj", "model.layers.61.mlp.experts.84.up_proj", "model.layers.61.mlp.experts.85.up_proj", "model.layers.61.mlp.experts.86.up_proj", "model.layers.61.mlp.experts.87.up_proj", "model.layers.61.mlp.experts.88.up_proj", "model.layers.61.mlp.experts.89.up_proj", "model.layers.61.mlp.experts.90.up_proj", "model.layers.61.mlp.experts.91.up_proj", "model.layers.61.mlp.experts.92.up_proj", "model.layers.61.mlp.experts.93.up_proj", "model.layers.61.mlp.experts.94.up_proj", "model.layers.61.mlp.experts.95.up_proj", "model.layers.61.mlp.experts.96.up_proj", "model.layers.61.mlp.experts.97.up_proj", "model.layers.61.mlp.experts.98.up_proj", "model.layers.61.mlp.experts.99.up_proj", "model.layers.61.mlp.experts.100.up_proj", "model.layers.61.mlp.experts.101.up_proj", "model.layers.61.mlp.experts.102.up_proj", "model.layers.61.mlp.experts.103.up_proj", "model.layers.61.mlp.experts.104.up_proj", "model.layers.61.mlp.experts.105.up_proj", "model.layers.61.mlp.experts.106.up_proj", "model.layers.61.mlp.experts.107.up_proj", "model.layers.61.mlp.experts.108.up_proj", "model.layers.61.mlp.experts.109.up_proj", "model.layers.61.mlp.experts.110.up_proj", "model.layers.61.mlp.experts.111.up_proj", "model.layers.61.mlp.experts.112.up_proj", "model.layers.61.mlp.experts.113.up_proj", "model.layers.61.mlp.experts.114.up_proj", "model.layers.61.mlp.experts.115.up_proj", "model.layers.61.mlp.experts.116.up_proj", "model.layers.61.mlp.experts.117.up_proj", "model.layers.61.mlp.experts.118.up_proj", "model.layers.61.mlp.experts.119.up_proj", "model.layers.61.mlp.experts.120.up_proj", "model.layers.61.mlp.experts.121.up_proj", "model.layers.61.mlp.experts.122.up_proj", "model.layers.61.mlp.experts.123.up_proj", "model.layers.61.mlp.experts.124.up_proj", "model.layers.61.mlp.experts.125.up_proj", "model.layers.61.mlp.experts.126.up_proj", "model.layers.61.mlp.experts.127.up_proj", "model.layers.61.mlp.experts.128.up_proj", "model.layers.61.mlp.experts.129.up_proj", "model.layers.61.mlp.experts.130.up_proj", "model.layers.61.mlp.experts.131.up_proj", "model.layers.61.mlp.experts.132.up_proj", "model.layers.61.mlp.experts.133.up_proj", "model.layers.61.mlp.experts.134.up_proj", "model.layers.61.mlp.experts.135.up_proj", "model.layers.61.mlp.experts.136.up_proj", "model.layers.61.mlp.experts.137.up_proj", "model.layers.61.mlp.experts.138.up_proj", "model.layers.61.mlp.experts.139.up_proj", "model.layers.61.mlp.experts.140.up_proj", "model.layers.61.mlp.experts.141.up_proj", "model.layers.61.mlp.experts.142.up_proj", "model.layers.61.mlp.experts.143.up_proj", "model.layers.61.mlp.experts.144.up_proj", "model.layers.61.mlp.experts.145.up_proj", "model.layers.61.mlp.experts.146.up_proj", "model.layers.61.mlp.experts.147.up_proj", "model.layers.61.mlp.experts.148.up_proj", "model.layers.61.mlp.experts.149.up_proj", "model.layers.61.mlp.experts.150.up_proj", "model.layers.61.mlp.experts.151.up_proj", "model.layers.61.mlp.experts.152.up_proj", "model.layers.61.mlp.experts.153.up_proj", "model.layers.61.mlp.experts.154.up_proj", "model.layers.61.mlp.experts.155.up_proj", "model.layers.61.mlp.experts.156.up_proj", "model.layers.61.mlp.experts.157.up_proj", "model.layers.61.mlp.experts.158.up_proj", "model.layers.61.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.8388172611592812e-05, "dbits": 2516582400 }, { "dkld": -2.5239353999494465e-05, "dbits": 5033164800 } ] }, { "idx": 368, "layers": [ "model.layers.61.mlp.experts.0.down_proj", "model.layers.61.mlp.experts.1.down_proj", "model.layers.61.mlp.experts.2.down_proj", "model.layers.61.mlp.experts.3.down_proj", "model.layers.61.mlp.experts.4.down_proj", "model.layers.61.mlp.experts.5.down_proj", "model.layers.61.mlp.experts.6.down_proj", "model.layers.61.mlp.experts.7.down_proj", "model.layers.61.mlp.experts.8.down_proj", "model.layers.61.mlp.experts.9.down_proj", "model.layers.61.mlp.experts.10.down_proj", "model.layers.61.mlp.experts.11.down_proj", "model.layers.61.mlp.experts.12.down_proj", "model.layers.61.mlp.experts.13.down_proj", "model.layers.61.mlp.experts.14.down_proj", "model.layers.61.mlp.experts.15.down_proj", "model.layers.61.mlp.experts.16.down_proj", "model.layers.61.mlp.experts.17.down_proj", "model.layers.61.mlp.experts.18.down_proj", "model.layers.61.mlp.experts.19.down_proj", "model.layers.61.mlp.experts.20.down_proj", "model.layers.61.mlp.experts.21.down_proj", "model.layers.61.mlp.experts.22.down_proj", "model.layers.61.mlp.experts.23.down_proj", "model.layers.61.mlp.experts.24.down_proj", "model.layers.61.mlp.experts.25.down_proj", "model.layers.61.mlp.experts.26.down_proj", "model.layers.61.mlp.experts.27.down_proj", "model.layers.61.mlp.experts.28.down_proj", "model.layers.61.mlp.experts.29.down_proj", "model.layers.61.mlp.experts.30.down_proj", "model.layers.61.mlp.experts.31.down_proj", "model.layers.61.mlp.experts.32.down_proj", "model.layers.61.mlp.experts.33.down_proj", "model.layers.61.mlp.experts.34.down_proj", "model.layers.61.mlp.experts.35.down_proj", "model.layers.61.mlp.experts.36.down_proj", "model.layers.61.mlp.experts.37.down_proj", "model.layers.61.mlp.experts.38.down_proj", "model.layers.61.mlp.experts.39.down_proj", "model.layers.61.mlp.experts.40.down_proj", "model.layers.61.mlp.experts.41.down_proj", "model.layers.61.mlp.experts.42.down_proj", "model.layers.61.mlp.experts.43.down_proj", "model.layers.61.mlp.experts.44.down_proj", "model.layers.61.mlp.experts.45.down_proj", "model.layers.61.mlp.experts.46.down_proj", "model.layers.61.mlp.experts.47.down_proj", "model.layers.61.mlp.experts.48.down_proj", "model.layers.61.mlp.experts.49.down_proj", "model.layers.61.mlp.experts.50.down_proj", "model.layers.61.mlp.experts.51.down_proj", "model.layers.61.mlp.experts.52.down_proj", "model.layers.61.mlp.experts.53.down_proj", "model.layers.61.mlp.experts.54.down_proj", "model.layers.61.mlp.experts.55.down_proj", "model.layers.61.mlp.experts.56.down_proj", "model.layers.61.mlp.experts.57.down_proj", "model.layers.61.mlp.experts.58.down_proj", "model.layers.61.mlp.experts.59.down_proj", "model.layers.61.mlp.experts.60.down_proj", "model.layers.61.mlp.experts.61.down_proj", "model.layers.61.mlp.experts.62.down_proj", "model.layers.61.mlp.experts.63.down_proj", "model.layers.61.mlp.experts.64.down_proj", "model.layers.61.mlp.experts.65.down_proj", "model.layers.61.mlp.experts.66.down_proj", "model.layers.61.mlp.experts.67.down_proj", "model.layers.61.mlp.experts.68.down_proj", "model.layers.61.mlp.experts.69.down_proj", "model.layers.61.mlp.experts.70.down_proj", "model.layers.61.mlp.experts.71.down_proj", "model.layers.61.mlp.experts.72.down_proj", "model.layers.61.mlp.experts.73.down_proj", "model.layers.61.mlp.experts.74.down_proj", "model.layers.61.mlp.experts.75.down_proj", "model.layers.61.mlp.experts.76.down_proj", "model.layers.61.mlp.experts.77.down_proj", "model.layers.61.mlp.experts.78.down_proj", "model.layers.61.mlp.experts.79.down_proj", "model.layers.61.mlp.experts.80.down_proj", "model.layers.61.mlp.experts.81.down_proj", "model.layers.61.mlp.experts.82.down_proj", "model.layers.61.mlp.experts.83.down_proj", "model.layers.61.mlp.experts.84.down_proj", "model.layers.61.mlp.experts.85.down_proj", "model.layers.61.mlp.experts.86.down_proj", "model.layers.61.mlp.experts.87.down_proj", "model.layers.61.mlp.experts.88.down_proj", "model.layers.61.mlp.experts.89.down_proj", "model.layers.61.mlp.experts.90.down_proj", "model.layers.61.mlp.experts.91.down_proj", "model.layers.61.mlp.experts.92.down_proj", "model.layers.61.mlp.experts.93.down_proj", "model.layers.61.mlp.experts.94.down_proj", "model.layers.61.mlp.experts.95.down_proj", "model.layers.61.mlp.experts.96.down_proj", "model.layers.61.mlp.experts.97.down_proj", "model.layers.61.mlp.experts.98.down_proj", "model.layers.61.mlp.experts.99.down_proj", "model.layers.61.mlp.experts.100.down_proj", "model.layers.61.mlp.experts.101.down_proj", "model.layers.61.mlp.experts.102.down_proj", "model.layers.61.mlp.experts.103.down_proj", "model.layers.61.mlp.experts.104.down_proj", "model.layers.61.mlp.experts.105.down_proj", "model.layers.61.mlp.experts.106.down_proj", "model.layers.61.mlp.experts.107.down_proj", "model.layers.61.mlp.experts.108.down_proj", "model.layers.61.mlp.experts.109.down_proj", "model.layers.61.mlp.experts.110.down_proj", "model.layers.61.mlp.experts.111.down_proj", "model.layers.61.mlp.experts.112.down_proj", "model.layers.61.mlp.experts.113.down_proj", "model.layers.61.mlp.experts.114.down_proj", "model.layers.61.mlp.experts.115.down_proj", "model.layers.61.mlp.experts.116.down_proj", "model.layers.61.mlp.experts.117.down_proj", "model.layers.61.mlp.experts.118.down_proj", "model.layers.61.mlp.experts.119.down_proj", "model.layers.61.mlp.experts.120.down_proj", "model.layers.61.mlp.experts.121.down_proj", "model.layers.61.mlp.experts.122.down_proj", "model.layers.61.mlp.experts.123.down_proj", "model.layers.61.mlp.experts.124.down_proj", "model.layers.61.mlp.experts.125.down_proj", "model.layers.61.mlp.experts.126.down_proj", "model.layers.61.mlp.experts.127.down_proj", "model.layers.61.mlp.experts.128.down_proj", "model.layers.61.mlp.experts.129.down_proj", "model.layers.61.mlp.experts.130.down_proj", "model.layers.61.mlp.experts.131.down_proj", "model.layers.61.mlp.experts.132.down_proj", "model.layers.61.mlp.experts.133.down_proj", "model.layers.61.mlp.experts.134.down_proj", "model.layers.61.mlp.experts.135.down_proj", "model.layers.61.mlp.experts.136.down_proj", "model.layers.61.mlp.experts.137.down_proj", "model.layers.61.mlp.experts.138.down_proj", "model.layers.61.mlp.experts.139.down_proj", "model.layers.61.mlp.experts.140.down_proj", "model.layers.61.mlp.experts.141.down_proj", "model.layers.61.mlp.experts.142.down_proj", "model.layers.61.mlp.experts.143.down_proj", "model.layers.61.mlp.experts.144.down_proj", "model.layers.61.mlp.experts.145.down_proj", "model.layers.61.mlp.experts.146.down_proj", "model.layers.61.mlp.experts.147.down_proj", "model.layers.61.mlp.experts.148.down_proj", "model.layers.61.mlp.experts.149.down_proj", "model.layers.61.mlp.experts.150.down_proj", "model.layers.61.mlp.experts.151.down_proj", "model.layers.61.mlp.experts.152.down_proj", "model.layers.61.mlp.experts.153.down_proj", "model.layers.61.mlp.experts.154.down_proj", "model.layers.61.mlp.experts.155.down_proj", "model.layers.61.mlp.experts.156.down_proj", "model.layers.61.mlp.experts.157.down_proj", "model.layers.61.mlp.experts.158.down_proj", "model.layers.61.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 2.2685993462801327e-05, "dbits": 1258291200 }, { "dkld": -1.175017096102099e-05, "dbits": 2516582400 } ] }, { "idx": 369, "layers": [ "model.layers.62.self_attn.q_proj" ], "candidates": [ { "dkld": 1.2194691225887386e-05, "dbits": 62914560 }, { "dkld": 7.986230775714268e-06, "dbits": 125829120 } ] }, { "idx": 370, "layers": [ "model.layers.62.self_attn.k_proj", "model.layers.62.self_attn.v_proj" ], "candidates": [ { "dkld": 1.6305176541209915e-05, "dbits": 10485760 }, { "dkld": 2.3268605582417445e-05, "dbits": 20971520 } ] }, { "idx": 371, "layers": [ "model.layers.62.self_attn.o_proj" ], "candidates": [ { "dkld": 1.366329379379888e-05, "dbits": 62914560 }, { "dkld": 1.1901394464075912e-05, "dbits": 125829120 } ] }, { "idx": 372, "layers": [ "model.layers.62.mlp.shared_experts.gate_proj", "model.layers.62.mlp.shared_experts.up_proj", "model.layers.62.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.5560863539577918e-05, "dbits": 23592960 }, { "dkld": -9.924033656716e-06, "dbits": 47185920 } ] }, { "idx": 373, "layers": [ "model.layers.62.mlp.experts.0.gate_proj", "model.layers.62.mlp.experts.1.gate_proj", "model.layers.62.mlp.experts.2.gate_proj", "model.layers.62.mlp.experts.3.gate_proj", "model.layers.62.mlp.experts.4.gate_proj", "model.layers.62.mlp.experts.5.gate_proj", "model.layers.62.mlp.experts.6.gate_proj", "model.layers.62.mlp.experts.7.gate_proj", "model.layers.62.mlp.experts.8.gate_proj", "model.layers.62.mlp.experts.9.gate_proj", "model.layers.62.mlp.experts.10.gate_proj", "model.layers.62.mlp.experts.11.gate_proj", "model.layers.62.mlp.experts.12.gate_proj", "model.layers.62.mlp.experts.13.gate_proj", "model.layers.62.mlp.experts.14.gate_proj", "model.layers.62.mlp.experts.15.gate_proj", "model.layers.62.mlp.experts.16.gate_proj", "model.layers.62.mlp.experts.17.gate_proj", "model.layers.62.mlp.experts.18.gate_proj", "model.layers.62.mlp.experts.19.gate_proj", "model.layers.62.mlp.experts.20.gate_proj", "model.layers.62.mlp.experts.21.gate_proj", "model.layers.62.mlp.experts.22.gate_proj", "model.layers.62.mlp.experts.23.gate_proj", "model.layers.62.mlp.experts.24.gate_proj", "model.layers.62.mlp.experts.25.gate_proj", "model.layers.62.mlp.experts.26.gate_proj", "model.layers.62.mlp.experts.27.gate_proj", "model.layers.62.mlp.experts.28.gate_proj", "model.layers.62.mlp.experts.29.gate_proj", "model.layers.62.mlp.experts.30.gate_proj", "model.layers.62.mlp.experts.31.gate_proj", "model.layers.62.mlp.experts.32.gate_proj", "model.layers.62.mlp.experts.33.gate_proj", "model.layers.62.mlp.experts.34.gate_proj", "model.layers.62.mlp.experts.35.gate_proj", "model.layers.62.mlp.experts.36.gate_proj", "model.layers.62.mlp.experts.37.gate_proj", "model.layers.62.mlp.experts.38.gate_proj", "model.layers.62.mlp.experts.39.gate_proj", "model.layers.62.mlp.experts.40.gate_proj", "model.layers.62.mlp.experts.41.gate_proj", "model.layers.62.mlp.experts.42.gate_proj", "model.layers.62.mlp.experts.43.gate_proj", "model.layers.62.mlp.experts.44.gate_proj", "model.layers.62.mlp.experts.45.gate_proj", "model.layers.62.mlp.experts.46.gate_proj", "model.layers.62.mlp.experts.47.gate_proj", "model.layers.62.mlp.experts.48.gate_proj", "model.layers.62.mlp.experts.49.gate_proj", "model.layers.62.mlp.experts.50.gate_proj", "model.layers.62.mlp.experts.51.gate_proj", "model.layers.62.mlp.experts.52.gate_proj", "model.layers.62.mlp.experts.53.gate_proj", "model.layers.62.mlp.experts.54.gate_proj", "model.layers.62.mlp.experts.55.gate_proj", "model.layers.62.mlp.experts.56.gate_proj", "model.layers.62.mlp.experts.57.gate_proj", "model.layers.62.mlp.experts.58.gate_proj", "model.layers.62.mlp.experts.59.gate_proj", "model.layers.62.mlp.experts.60.gate_proj", "model.layers.62.mlp.experts.61.gate_proj", "model.layers.62.mlp.experts.62.gate_proj", "model.layers.62.mlp.experts.63.gate_proj", "model.layers.62.mlp.experts.64.gate_proj", "model.layers.62.mlp.experts.65.gate_proj", "model.layers.62.mlp.experts.66.gate_proj", "model.layers.62.mlp.experts.67.gate_proj", "model.layers.62.mlp.experts.68.gate_proj", "model.layers.62.mlp.experts.69.gate_proj", "model.layers.62.mlp.experts.70.gate_proj", "model.layers.62.mlp.experts.71.gate_proj", "model.layers.62.mlp.experts.72.gate_proj", "model.layers.62.mlp.experts.73.gate_proj", "model.layers.62.mlp.experts.74.gate_proj", "model.layers.62.mlp.experts.75.gate_proj", "model.layers.62.mlp.experts.76.gate_proj", "model.layers.62.mlp.experts.77.gate_proj", "model.layers.62.mlp.experts.78.gate_proj", "model.layers.62.mlp.experts.79.gate_proj", "model.layers.62.mlp.experts.80.gate_proj", "model.layers.62.mlp.experts.81.gate_proj", "model.layers.62.mlp.experts.82.gate_proj", "model.layers.62.mlp.experts.83.gate_proj", "model.layers.62.mlp.experts.84.gate_proj", "model.layers.62.mlp.experts.85.gate_proj", "model.layers.62.mlp.experts.86.gate_proj", "model.layers.62.mlp.experts.87.gate_proj", "model.layers.62.mlp.experts.88.gate_proj", "model.layers.62.mlp.experts.89.gate_proj", "model.layers.62.mlp.experts.90.gate_proj", "model.layers.62.mlp.experts.91.gate_proj", "model.layers.62.mlp.experts.92.gate_proj", "model.layers.62.mlp.experts.93.gate_proj", "model.layers.62.mlp.experts.94.gate_proj", "model.layers.62.mlp.experts.95.gate_proj", "model.layers.62.mlp.experts.96.gate_proj", "model.layers.62.mlp.experts.97.gate_proj", "model.layers.62.mlp.experts.98.gate_proj", "model.layers.62.mlp.experts.99.gate_proj", "model.layers.62.mlp.experts.100.gate_proj", "model.layers.62.mlp.experts.101.gate_proj", "model.layers.62.mlp.experts.102.gate_proj", "model.layers.62.mlp.experts.103.gate_proj", "model.layers.62.mlp.experts.104.gate_proj", "model.layers.62.mlp.experts.105.gate_proj", "model.layers.62.mlp.experts.106.gate_proj", "model.layers.62.mlp.experts.107.gate_proj", "model.layers.62.mlp.experts.108.gate_proj", "model.layers.62.mlp.experts.109.gate_proj", "model.layers.62.mlp.experts.110.gate_proj", "model.layers.62.mlp.experts.111.gate_proj", "model.layers.62.mlp.experts.112.gate_proj", "model.layers.62.mlp.experts.113.gate_proj", "model.layers.62.mlp.experts.114.gate_proj", "model.layers.62.mlp.experts.115.gate_proj", "model.layers.62.mlp.experts.116.gate_proj", "model.layers.62.mlp.experts.117.gate_proj", "model.layers.62.mlp.experts.118.gate_proj", "model.layers.62.mlp.experts.119.gate_proj", "model.layers.62.mlp.experts.120.gate_proj", "model.layers.62.mlp.experts.121.gate_proj", "model.layers.62.mlp.experts.122.gate_proj", "model.layers.62.mlp.experts.123.gate_proj", "model.layers.62.mlp.experts.124.gate_proj", "model.layers.62.mlp.experts.125.gate_proj", "model.layers.62.mlp.experts.126.gate_proj", "model.layers.62.mlp.experts.127.gate_proj", "model.layers.62.mlp.experts.128.gate_proj", "model.layers.62.mlp.experts.129.gate_proj", "model.layers.62.mlp.experts.130.gate_proj", "model.layers.62.mlp.experts.131.gate_proj", "model.layers.62.mlp.experts.132.gate_proj", "model.layers.62.mlp.experts.133.gate_proj", "model.layers.62.mlp.experts.134.gate_proj", "model.layers.62.mlp.experts.135.gate_proj", "model.layers.62.mlp.experts.136.gate_proj", "model.layers.62.mlp.experts.137.gate_proj", "model.layers.62.mlp.experts.138.gate_proj", "model.layers.62.mlp.experts.139.gate_proj", "model.layers.62.mlp.experts.140.gate_proj", "model.layers.62.mlp.experts.141.gate_proj", "model.layers.62.mlp.experts.142.gate_proj", "model.layers.62.mlp.experts.143.gate_proj", "model.layers.62.mlp.experts.144.gate_proj", "model.layers.62.mlp.experts.145.gate_proj", "model.layers.62.mlp.experts.146.gate_proj", "model.layers.62.mlp.experts.147.gate_proj", "model.layers.62.mlp.experts.148.gate_proj", "model.layers.62.mlp.experts.149.gate_proj", "model.layers.62.mlp.experts.150.gate_proj", "model.layers.62.mlp.experts.151.gate_proj", "model.layers.62.mlp.experts.152.gate_proj", "model.layers.62.mlp.experts.153.gate_proj", "model.layers.62.mlp.experts.154.gate_proj", "model.layers.62.mlp.experts.155.gate_proj", "model.layers.62.mlp.experts.156.gate_proj", "model.layers.62.mlp.experts.157.gate_proj", "model.layers.62.mlp.experts.158.gate_proj", "model.layers.62.mlp.experts.159.gate_proj", "model.layers.62.mlp.experts.0.up_proj", "model.layers.62.mlp.experts.1.up_proj", "model.layers.62.mlp.experts.2.up_proj", "model.layers.62.mlp.experts.3.up_proj", "model.layers.62.mlp.experts.4.up_proj", "model.layers.62.mlp.experts.5.up_proj", "model.layers.62.mlp.experts.6.up_proj", "model.layers.62.mlp.experts.7.up_proj", "model.layers.62.mlp.experts.8.up_proj", "model.layers.62.mlp.experts.9.up_proj", "model.layers.62.mlp.experts.10.up_proj", "model.layers.62.mlp.experts.11.up_proj", "model.layers.62.mlp.experts.12.up_proj", "model.layers.62.mlp.experts.13.up_proj", "model.layers.62.mlp.experts.14.up_proj", "model.layers.62.mlp.experts.15.up_proj", "model.layers.62.mlp.experts.16.up_proj", "model.layers.62.mlp.experts.17.up_proj", "model.layers.62.mlp.experts.18.up_proj", "model.layers.62.mlp.experts.19.up_proj", "model.layers.62.mlp.experts.20.up_proj", "model.layers.62.mlp.experts.21.up_proj", "model.layers.62.mlp.experts.22.up_proj", "model.layers.62.mlp.experts.23.up_proj", "model.layers.62.mlp.experts.24.up_proj", "model.layers.62.mlp.experts.25.up_proj", "model.layers.62.mlp.experts.26.up_proj", "model.layers.62.mlp.experts.27.up_proj", "model.layers.62.mlp.experts.28.up_proj", "model.layers.62.mlp.experts.29.up_proj", "model.layers.62.mlp.experts.30.up_proj", "model.layers.62.mlp.experts.31.up_proj", "model.layers.62.mlp.experts.32.up_proj", "model.layers.62.mlp.experts.33.up_proj", "model.layers.62.mlp.experts.34.up_proj", "model.layers.62.mlp.experts.35.up_proj", "model.layers.62.mlp.experts.36.up_proj", "model.layers.62.mlp.experts.37.up_proj", "model.layers.62.mlp.experts.38.up_proj", "model.layers.62.mlp.experts.39.up_proj", "model.layers.62.mlp.experts.40.up_proj", "model.layers.62.mlp.experts.41.up_proj", "model.layers.62.mlp.experts.42.up_proj", "model.layers.62.mlp.experts.43.up_proj", "model.layers.62.mlp.experts.44.up_proj", "model.layers.62.mlp.experts.45.up_proj", "model.layers.62.mlp.experts.46.up_proj", "model.layers.62.mlp.experts.47.up_proj", "model.layers.62.mlp.experts.48.up_proj", "model.layers.62.mlp.experts.49.up_proj", "model.layers.62.mlp.experts.50.up_proj", "model.layers.62.mlp.experts.51.up_proj", "model.layers.62.mlp.experts.52.up_proj", "model.layers.62.mlp.experts.53.up_proj", "model.layers.62.mlp.experts.54.up_proj", "model.layers.62.mlp.experts.55.up_proj", "model.layers.62.mlp.experts.56.up_proj", "model.layers.62.mlp.experts.57.up_proj", "model.layers.62.mlp.experts.58.up_proj", "model.layers.62.mlp.experts.59.up_proj", "model.layers.62.mlp.experts.60.up_proj", "model.layers.62.mlp.experts.61.up_proj", "model.layers.62.mlp.experts.62.up_proj", "model.layers.62.mlp.experts.63.up_proj", "model.layers.62.mlp.experts.64.up_proj", "model.layers.62.mlp.experts.65.up_proj", "model.layers.62.mlp.experts.66.up_proj", "model.layers.62.mlp.experts.67.up_proj", "model.layers.62.mlp.experts.68.up_proj", "model.layers.62.mlp.experts.69.up_proj", "model.layers.62.mlp.experts.70.up_proj", "model.layers.62.mlp.experts.71.up_proj", "model.layers.62.mlp.experts.72.up_proj", "model.layers.62.mlp.experts.73.up_proj", "model.layers.62.mlp.experts.74.up_proj", "model.layers.62.mlp.experts.75.up_proj", "model.layers.62.mlp.experts.76.up_proj", "model.layers.62.mlp.experts.77.up_proj", "model.layers.62.mlp.experts.78.up_proj", "model.layers.62.mlp.experts.79.up_proj", "model.layers.62.mlp.experts.80.up_proj", "model.layers.62.mlp.experts.81.up_proj", "model.layers.62.mlp.experts.82.up_proj", "model.layers.62.mlp.experts.83.up_proj", "model.layers.62.mlp.experts.84.up_proj", "model.layers.62.mlp.experts.85.up_proj", "model.layers.62.mlp.experts.86.up_proj", "model.layers.62.mlp.experts.87.up_proj", "model.layers.62.mlp.experts.88.up_proj", "model.layers.62.mlp.experts.89.up_proj", "model.layers.62.mlp.experts.90.up_proj", "model.layers.62.mlp.experts.91.up_proj", "model.layers.62.mlp.experts.92.up_proj", "model.layers.62.mlp.experts.93.up_proj", "model.layers.62.mlp.experts.94.up_proj", "model.layers.62.mlp.experts.95.up_proj", "model.layers.62.mlp.experts.96.up_proj", "model.layers.62.mlp.experts.97.up_proj", "model.layers.62.mlp.experts.98.up_proj", "model.layers.62.mlp.experts.99.up_proj", "model.layers.62.mlp.experts.100.up_proj", "model.layers.62.mlp.experts.101.up_proj", "model.layers.62.mlp.experts.102.up_proj", "model.layers.62.mlp.experts.103.up_proj", "model.layers.62.mlp.experts.104.up_proj", "model.layers.62.mlp.experts.105.up_proj", "model.layers.62.mlp.experts.106.up_proj", "model.layers.62.mlp.experts.107.up_proj", "model.layers.62.mlp.experts.108.up_proj", "model.layers.62.mlp.experts.109.up_proj", "model.layers.62.mlp.experts.110.up_proj", "model.layers.62.mlp.experts.111.up_proj", "model.layers.62.mlp.experts.112.up_proj", "model.layers.62.mlp.experts.113.up_proj", "model.layers.62.mlp.experts.114.up_proj", "model.layers.62.mlp.experts.115.up_proj", "model.layers.62.mlp.experts.116.up_proj", "model.layers.62.mlp.experts.117.up_proj", "model.layers.62.mlp.experts.118.up_proj", "model.layers.62.mlp.experts.119.up_proj", "model.layers.62.mlp.experts.120.up_proj", "model.layers.62.mlp.experts.121.up_proj", "model.layers.62.mlp.experts.122.up_proj", "model.layers.62.mlp.experts.123.up_proj", "model.layers.62.mlp.experts.124.up_proj", "model.layers.62.mlp.experts.125.up_proj", "model.layers.62.mlp.experts.126.up_proj", "model.layers.62.mlp.experts.127.up_proj", "model.layers.62.mlp.experts.128.up_proj", "model.layers.62.mlp.experts.129.up_proj", "model.layers.62.mlp.experts.130.up_proj", "model.layers.62.mlp.experts.131.up_proj", "model.layers.62.mlp.experts.132.up_proj", "model.layers.62.mlp.experts.133.up_proj", "model.layers.62.mlp.experts.134.up_proj", "model.layers.62.mlp.experts.135.up_proj", "model.layers.62.mlp.experts.136.up_proj", "model.layers.62.mlp.experts.137.up_proj", "model.layers.62.mlp.experts.138.up_proj", "model.layers.62.mlp.experts.139.up_proj", "model.layers.62.mlp.experts.140.up_proj", "model.layers.62.mlp.experts.141.up_proj", "model.layers.62.mlp.experts.142.up_proj", "model.layers.62.mlp.experts.143.up_proj", "model.layers.62.mlp.experts.144.up_proj", "model.layers.62.mlp.experts.145.up_proj", "model.layers.62.mlp.experts.146.up_proj", "model.layers.62.mlp.experts.147.up_proj", "model.layers.62.mlp.experts.148.up_proj", "model.layers.62.mlp.experts.149.up_proj", "model.layers.62.mlp.experts.150.up_proj", "model.layers.62.mlp.experts.151.up_proj", "model.layers.62.mlp.experts.152.up_proj", "model.layers.62.mlp.experts.153.up_proj", "model.layers.62.mlp.experts.154.up_proj", "model.layers.62.mlp.experts.155.up_proj", "model.layers.62.mlp.experts.156.up_proj", "model.layers.62.mlp.experts.157.up_proj", "model.layers.62.mlp.experts.158.up_proj", "model.layers.62.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -6.578257307409893e-06, "dbits": 2516582400 }, { "dkld": -9.3223992735144e-06, "dbits": 5033164800 } ] }, { "idx": 374, "layers": [ "model.layers.62.mlp.experts.0.down_proj", "model.layers.62.mlp.experts.1.down_proj", "model.layers.62.mlp.experts.2.down_proj", "model.layers.62.mlp.experts.3.down_proj", "model.layers.62.mlp.experts.4.down_proj", "model.layers.62.mlp.experts.5.down_proj", "model.layers.62.mlp.experts.6.down_proj", "model.layers.62.mlp.experts.7.down_proj", "model.layers.62.mlp.experts.8.down_proj", "model.layers.62.mlp.experts.9.down_proj", "model.layers.62.mlp.experts.10.down_proj", "model.layers.62.mlp.experts.11.down_proj", "model.layers.62.mlp.experts.12.down_proj", "model.layers.62.mlp.experts.13.down_proj", "model.layers.62.mlp.experts.14.down_proj", "model.layers.62.mlp.experts.15.down_proj", "model.layers.62.mlp.experts.16.down_proj", "model.layers.62.mlp.experts.17.down_proj", "model.layers.62.mlp.experts.18.down_proj", "model.layers.62.mlp.experts.19.down_proj", "model.layers.62.mlp.experts.20.down_proj", "model.layers.62.mlp.experts.21.down_proj", "model.layers.62.mlp.experts.22.down_proj", "model.layers.62.mlp.experts.23.down_proj", "model.layers.62.mlp.experts.24.down_proj", "model.layers.62.mlp.experts.25.down_proj", "model.layers.62.mlp.experts.26.down_proj", "model.layers.62.mlp.experts.27.down_proj", "model.layers.62.mlp.experts.28.down_proj", "model.layers.62.mlp.experts.29.down_proj", "model.layers.62.mlp.experts.30.down_proj", "model.layers.62.mlp.experts.31.down_proj", "model.layers.62.mlp.experts.32.down_proj", "model.layers.62.mlp.experts.33.down_proj", "model.layers.62.mlp.experts.34.down_proj", "model.layers.62.mlp.experts.35.down_proj", "model.layers.62.mlp.experts.36.down_proj", "model.layers.62.mlp.experts.37.down_proj", "model.layers.62.mlp.experts.38.down_proj", "model.layers.62.mlp.experts.39.down_proj", "model.layers.62.mlp.experts.40.down_proj", "model.layers.62.mlp.experts.41.down_proj", "model.layers.62.mlp.experts.42.down_proj", "model.layers.62.mlp.experts.43.down_proj", "model.layers.62.mlp.experts.44.down_proj", "model.layers.62.mlp.experts.45.down_proj", "model.layers.62.mlp.experts.46.down_proj", "model.layers.62.mlp.experts.47.down_proj", "model.layers.62.mlp.experts.48.down_proj", "model.layers.62.mlp.experts.49.down_proj", "model.layers.62.mlp.experts.50.down_proj", "model.layers.62.mlp.experts.51.down_proj", "model.layers.62.mlp.experts.52.down_proj", "model.layers.62.mlp.experts.53.down_proj", "model.layers.62.mlp.experts.54.down_proj", "model.layers.62.mlp.experts.55.down_proj", "model.layers.62.mlp.experts.56.down_proj", "model.layers.62.mlp.experts.57.down_proj", "model.layers.62.mlp.experts.58.down_proj", "model.layers.62.mlp.experts.59.down_proj", "model.layers.62.mlp.experts.60.down_proj", "model.layers.62.mlp.experts.61.down_proj", "model.layers.62.mlp.experts.62.down_proj", "model.layers.62.mlp.experts.63.down_proj", "model.layers.62.mlp.experts.64.down_proj", "model.layers.62.mlp.experts.65.down_proj", "model.layers.62.mlp.experts.66.down_proj", "model.layers.62.mlp.experts.67.down_proj", "model.layers.62.mlp.experts.68.down_proj", "model.layers.62.mlp.experts.69.down_proj", "model.layers.62.mlp.experts.70.down_proj", "model.layers.62.mlp.experts.71.down_proj", "model.layers.62.mlp.experts.72.down_proj", "model.layers.62.mlp.experts.73.down_proj", "model.layers.62.mlp.experts.74.down_proj", "model.layers.62.mlp.experts.75.down_proj", "model.layers.62.mlp.experts.76.down_proj", "model.layers.62.mlp.experts.77.down_proj", "model.layers.62.mlp.experts.78.down_proj", "model.layers.62.mlp.experts.79.down_proj", "model.layers.62.mlp.experts.80.down_proj", "model.layers.62.mlp.experts.81.down_proj", "model.layers.62.mlp.experts.82.down_proj", "model.layers.62.mlp.experts.83.down_proj", "model.layers.62.mlp.experts.84.down_proj", "model.layers.62.mlp.experts.85.down_proj", "model.layers.62.mlp.experts.86.down_proj", "model.layers.62.mlp.experts.87.down_proj", "model.layers.62.mlp.experts.88.down_proj", "model.layers.62.mlp.experts.89.down_proj", "model.layers.62.mlp.experts.90.down_proj", "model.layers.62.mlp.experts.91.down_proj", "model.layers.62.mlp.experts.92.down_proj", "model.layers.62.mlp.experts.93.down_proj", "model.layers.62.mlp.experts.94.down_proj", "model.layers.62.mlp.experts.95.down_proj", "model.layers.62.mlp.experts.96.down_proj", "model.layers.62.mlp.experts.97.down_proj", "model.layers.62.mlp.experts.98.down_proj", "model.layers.62.mlp.experts.99.down_proj", "model.layers.62.mlp.experts.100.down_proj", "model.layers.62.mlp.experts.101.down_proj", "model.layers.62.mlp.experts.102.down_proj", "model.layers.62.mlp.experts.103.down_proj", "model.layers.62.mlp.experts.104.down_proj", "model.layers.62.mlp.experts.105.down_proj", "model.layers.62.mlp.experts.106.down_proj", "model.layers.62.mlp.experts.107.down_proj", "model.layers.62.mlp.experts.108.down_proj", "model.layers.62.mlp.experts.109.down_proj", "model.layers.62.mlp.experts.110.down_proj", "model.layers.62.mlp.experts.111.down_proj", "model.layers.62.mlp.experts.112.down_proj", "model.layers.62.mlp.experts.113.down_proj", "model.layers.62.mlp.experts.114.down_proj", "model.layers.62.mlp.experts.115.down_proj", "model.layers.62.mlp.experts.116.down_proj", "model.layers.62.mlp.experts.117.down_proj", "model.layers.62.mlp.experts.118.down_proj", "model.layers.62.mlp.experts.119.down_proj", "model.layers.62.mlp.experts.120.down_proj", "model.layers.62.mlp.experts.121.down_proj", "model.layers.62.mlp.experts.122.down_proj", "model.layers.62.mlp.experts.123.down_proj", "model.layers.62.mlp.experts.124.down_proj", "model.layers.62.mlp.experts.125.down_proj", "model.layers.62.mlp.experts.126.down_proj", "model.layers.62.mlp.experts.127.down_proj", "model.layers.62.mlp.experts.128.down_proj", "model.layers.62.mlp.experts.129.down_proj", "model.layers.62.mlp.experts.130.down_proj", "model.layers.62.mlp.experts.131.down_proj", "model.layers.62.mlp.experts.132.down_proj", "model.layers.62.mlp.experts.133.down_proj", "model.layers.62.mlp.experts.134.down_proj", "model.layers.62.mlp.experts.135.down_proj", "model.layers.62.mlp.experts.136.down_proj", "model.layers.62.mlp.experts.137.down_proj", "model.layers.62.mlp.experts.138.down_proj", "model.layers.62.mlp.experts.139.down_proj", "model.layers.62.mlp.experts.140.down_proj", "model.layers.62.mlp.experts.141.down_proj", "model.layers.62.mlp.experts.142.down_proj", "model.layers.62.mlp.experts.143.down_proj", "model.layers.62.mlp.experts.144.down_proj", "model.layers.62.mlp.experts.145.down_proj", "model.layers.62.mlp.experts.146.down_proj", "model.layers.62.mlp.experts.147.down_proj", "model.layers.62.mlp.experts.148.down_proj", "model.layers.62.mlp.experts.149.down_proj", "model.layers.62.mlp.experts.150.down_proj", "model.layers.62.mlp.experts.151.down_proj", "model.layers.62.mlp.experts.152.down_proj", "model.layers.62.mlp.experts.153.down_proj", "model.layers.62.mlp.experts.154.down_proj", "model.layers.62.mlp.experts.155.down_proj", "model.layers.62.mlp.experts.156.down_proj", "model.layers.62.mlp.experts.157.down_proj", "model.layers.62.mlp.experts.158.down_proj", "model.layers.62.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 4.4882064685232426e-06, "dbits": 1258291200 }, { "dkld": -8.428096771239887e-06, "dbits": 2516582400 } ] }, { "idx": 375, "layers": [ "model.layers.63.self_attn.q_proj" ], "candidates": [ { "dkld": -2.4276273325084946e-05, "dbits": 62914560 }, { "dkld": -2.9981136322021484e-05, "dbits": 125829120 } ] }, { "idx": 376, "layers": [ "model.layers.63.self_attn.k_proj", "model.layers.63.self_attn.v_proj" ], "candidates": [ { "dkld": 7.1432674303654325e-06, "dbits": 10485760 }, { "dkld": -1.85605138540261e-05, "dbits": 20971520 } ] }, { "idx": 377, "layers": [ "model.layers.63.self_attn.o_proj" ], "candidates": [ { "dkld": 8.52497760206461e-06, "dbits": 62914560 }, { "dkld": 1.3514072634279728e-05, "dbits": 125829120 } ] }, { "idx": 378, "layers": [ "model.layers.63.mlp.shared_experts.gate_proj", "model.layers.63.mlp.shared_experts.up_proj", "model.layers.63.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.6815774142741116e-05, "dbits": 23592960 }, { "dkld": -4.3596606701598595e-06, "dbits": 47185920 } ] }, { "idx": 379, "layers": [ "model.layers.63.mlp.experts.0.gate_proj", "model.layers.63.mlp.experts.1.gate_proj", "model.layers.63.mlp.experts.2.gate_proj", "model.layers.63.mlp.experts.3.gate_proj", "model.layers.63.mlp.experts.4.gate_proj", "model.layers.63.mlp.experts.5.gate_proj", "model.layers.63.mlp.experts.6.gate_proj", "model.layers.63.mlp.experts.7.gate_proj", "model.layers.63.mlp.experts.8.gate_proj", "model.layers.63.mlp.experts.9.gate_proj", "model.layers.63.mlp.experts.10.gate_proj", "model.layers.63.mlp.experts.11.gate_proj", "model.layers.63.mlp.experts.12.gate_proj", "model.layers.63.mlp.experts.13.gate_proj", "model.layers.63.mlp.experts.14.gate_proj", "model.layers.63.mlp.experts.15.gate_proj", "model.layers.63.mlp.experts.16.gate_proj", "model.layers.63.mlp.experts.17.gate_proj", "model.layers.63.mlp.experts.18.gate_proj", "model.layers.63.mlp.experts.19.gate_proj", "model.layers.63.mlp.experts.20.gate_proj", "model.layers.63.mlp.experts.21.gate_proj", "model.layers.63.mlp.experts.22.gate_proj", "model.layers.63.mlp.experts.23.gate_proj", "model.layers.63.mlp.experts.24.gate_proj", "model.layers.63.mlp.experts.25.gate_proj", "model.layers.63.mlp.experts.26.gate_proj", "model.layers.63.mlp.experts.27.gate_proj", "model.layers.63.mlp.experts.28.gate_proj", "model.layers.63.mlp.experts.29.gate_proj", "model.layers.63.mlp.experts.30.gate_proj", "model.layers.63.mlp.experts.31.gate_proj", "model.layers.63.mlp.experts.32.gate_proj", "model.layers.63.mlp.experts.33.gate_proj", "model.layers.63.mlp.experts.34.gate_proj", "model.layers.63.mlp.experts.35.gate_proj", "model.layers.63.mlp.experts.36.gate_proj", "model.layers.63.mlp.experts.37.gate_proj", "model.layers.63.mlp.experts.38.gate_proj", "model.layers.63.mlp.experts.39.gate_proj", "model.layers.63.mlp.experts.40.gate_proj", "model.layers.63.mlp.experts.41.gate_proj", "model.layers.63.mlp.experts.42.gate_proj", "model.layers.63.mlp.experts.43.gate_proj", "model.layers.63.mlp.experts.44.gate_proj", "model.layers.63.mlp.experts.45.gate_proj", "model.layers.63.mlp.experts.46.gate_proj", "model.layers.63.mlp.experts.47.gate_proj", "model.layers.63.mlp.experts.48.gate_proj", "model.layers.63.mlp.experts.49.gate_proj", "model.layers.63.mlp.experts.50.gate_proj", "model.layers.63.mlp.experts.51.gate_proj", "model.layers.63.mlp.experts.52.gate_proj", "model.layers.63.mlp.experts.53.gate_proj", "model.layers.63.mlp.experts.54.gate_proj", "model.layers.63.mlp.experts.55.gate_proj", "model.layers.63.mlp.experts.56.gate_proj", "model.layers.63.mlp.experts.57.gate_proj", "model.layers.63.mlp.experts.58.gate_proj", "model.layers.63.mlp.experts.59.gate_proj", "model.layers.63.mlp.experts.60.gate_proj", "model.layers.63.mlp.experts.61.gate_proj", "model.layers.63.mlp.experts.62.gate_proj", "model.layers.63.mlp.experts.63.gate_proj", "model.layers.63.mlp.experts.64.gate_proj", "model.layers.63.mlp.experts.65.gate_proj", "model.layers.63.mlp.experts.66.gate_proj", "model.layers.63.mlp.experts.67.gate_proj", "model.layers.63.mlp.experts.68.gate_proj", "model.layers.63.mlp.experts.69.gate_proj", "model.layers.63.mlp.experts.70.gate_proj", "model.layers.63.mlp.experts.71.gate_proj", "model.layers.63.mlp.experts.72.gate_proj", "model.layers.63.mlp.experts.73.gate_proj", "model.layers.63.mlp.experts.74.gate_proj", "model.layers.63.mlp.experts.75.gate_proj", "model.layers.63.mlp.experts.76.gate_proj", "model.layers.63.mlp.experts.77.gate_proj", "model.layers.63.mlp.experts.78.gate_proj", "model.layers.63.mlp.experts.79.gate_proj", "model.layers.63.mlp.experts.80.gate_proj", "model.layers.63.mlp.experts.81.gate_proj", "model.layers.63.mlp.experts.82.gate_proj", "model.layers.63.mlp.experts.83.gate_proj", "model.layers.63.mlp.experts.84.gate_proj", "model.layers.63.mlp.experts.85.gate_proj", "model.layers.63.mlp.experts.86.gate_proj", "model.layers.63.mlp.experts.87.gate_proj", "model.layers.63.mlp.experts.88.gate_proj", "model.layers.63.mlp.experts.89.gate_proj", "model.layers.63.mlp.experts.90.gate_proj", "model.layers.63.mlp.experts.91.gate_proj", "model.layers.63.mlp.experts.92.gate_proj", "model.layers.63.mlp.experts.93.gate_proj", "model.layers.63.mlp.experts.94.gate_proj", "model.layers.63.mlp.experts.95.gate_proj", "model.layers.63.mlp.experts.96.gate_proj", "model.layers.63.mlp.experts.97.gate_proj", "model.layers.63.mlp.experts.98.gate_proj", "model.layers.63.mlp.experts.99.gate_proj", "model.layers.63.mlp.experts.100.gate_proj", "model.layers.63.mlp.experts.101.gate_proj", "model.layers.63.mlp.experts.102.gate_proj", "model.layers.63.mlp.experts.103.gate_proj", "model.layers.63.mlp.experts.104.gate_proj", "model.layers.63.mlp.experts.105.gate_proj", "model.layers.63.mlp.experts.106.gate_proj", "model.layers.63.mlp.experts.107.gate_proj", "model.layers.63.mlp.experts.108.gate_proj", "model.layers.63.mlp.experts.109.gate_proj", "model.layers.63.mlp.experts.110.gate_proj", "model.layers.63.mlp.experts.111.gate_proj", "model.layers.63.mlp.experts.112.gate_proj", "model.layers.63.mlp.experts.113.gate_proj", "model.layers.63.mlp.experts.114.gate_proj", "model.layers.63.mlp.experts.115.gate_proj", "model.layers.63.mlp.experts.116.gate_proj", "model.layers.63.mlp.experts.117.gate_proj", "model.layers.63.mlp.experts.118.gate_proj", "model.layers.63.mlp.experts.119.gate_proj", "model.layers.63.mlp.experts.120.gate_proj", "model.layers.63.mlp.experts.121.gate_proj", "model.layers.63.mlp.experts.122.gate_proj", "model.layers.63.mlp.experts.123.gate_proj", "model.layers.63.mlp.experts.124.gate_proj", "model.layers.63.mlp.experts.125.gate_proj", "model.layers.63.mlp.experts.126.gate_proj", "model.layers.63.mlp.experts.127.gate_proj", "model.layers.63.mlp.experts.128.gate_proj", "model.layers.63.mlp.experts.129.gate_proj", "model.layers.63.mlp.experts.130.gate_proj", "model.layers.63.mlp.experts.131.gate_proj", "model.layers.63.mlp.experts.132.gate_proj", "model.layers.63.mlp.experts.133.gate_proj", "model.layers.63.mlp.experts.134.gate_proj", "model.layers.63.mlp.experts.135.gate_proj", "model.layers.63.mlp.experts.136.gate_proj", "model.layers.63.mlp.experts.137.gate_proj", "model.layers.63.mlp.experts.138.gate_proj", "model.layers.63.mlp.experts.139.gate_proj", "model.layers.63.mlp.experts.140.gate_proj", "model.layers.63.mlp.experts.141.gate_proj", "model.layers.63.mlp.experts.142.gate_proj", "model.layers.63.mlp.experts.143.gate_proj", "model.layers.63.mlp.experts.144.gate_proj", "model.layers.63.mlp.experts.145.gate_proj", "model.layers.63.mlp.experts.146.gate_proj", "model.layers.63.mlp.experts.147.gate_proj", "model.layers.63.mlp.experts.148.gate_proj", "model.layers.63.mlp.experts.149.gate_proj", "model.layers.63.mlp.experts.150.gate_proj", "model.layers.63.mlp.experts.151.gate_proj", "model.layers.63.mlp.experts.152.gate_proj", "model.layers.63.mlp.experts.153.gate_proj", "model.layers.63.mlp.experts.154.gate_proj", "model.layers.63.mlp.experts.155.gate_proj", "model.layers.63.mlp.experts.156.gate_proj", "model.layers.63.mlp.experts.157.gate_proj", "model.layers.63.mlp.experts.158.gate_proj", "model.layers.63.mlp.experts.159.gate_proj", "model.layers.63.mlp.experts.0.up_proj", "model.layers.63.mlp.experts.1.up_proj", "model.layers.63.mlp.experts.2.up_proj", "model.layers.63.mlp.experts.3.up_proj", "model.layers.63.mlp.experts.4.up_proj", "model.layers.63.mlp.experts.5.up_proj", "model.layers.63.mlp.experts.6.up_proj", "model.layers.63.mlp.experts.7.up_proj", "model.layers.63.mlp.experts.8.up_proj", "model.layers.63.mlp.experts.9.up_proj", "model.layers.63.mlp.experts.10.up_proj", "model.layers.63.mlp.experts.11.up_proj", "model.layers.63.mlp.experts.12.up_proj", "model.layers.63.mlp.experts.13.up_proj", "model.layers.63.mlp.experts.14.up_proj", "model.layers.63.mlp.experts.15.up_proj", "model.layers.63.mlp.experts.16.up_proj", "model.layers.63.mlp.experts.17.up_proj", "model.layers.63.mlp.experts.18.up_proj", "model.layers.63.mlp.experts.19.up_proj", "model.layers.63.mlp.experts.20.up_proj", "model.layers.63.mlp.experts.21.up_proj", "model.layers.63.mlp.experts.22.up_proj", "model.layers.63.mlp.experts.23.up_proj", "model.layers.63.mlp.experts.24.up_proj", "model.layers.63.mlp.experts.25.up_proj", "model.layers.63.mlp.experts.26.up_proj", "model.layers.63.mlp.experts.27.up_proj", "model.layers.63.mlp.experts.28.up_proj", "model.layers.63.mlp.experts.29.up_proj", "model.layers.63.mlp.experts.30.up_proj", "model.layers.63.mlp.experts.31.up_proj", "model.layers.63.mlp.experts.32.up_proj", "model.layers.63.mlp.experts.33.up_proj", "model.layers.63.mlp.experts.34.up_proj", "model.layers.63.mlp.experts.35.up_proj", "model.layers.63.mlp.experts.36.up_proj", "model.layers.63.mlp.experts.37.up_proj", "model.layers.63.mlp.experts.38.up_proj", "model.layers.63.mlp.experts.39.up_proj", "model.layers.63.mlp.experts.40.up_proj", "model.layers.63.mlp.experts.41.up_proj", "model.layers.63.mlp.experts.42.up_proj", "model.layers.63.mlp.experts.43.up_proj", "model.layers.63.mlp.experts.44.up_proj", "model.layers.63.mlp.experts.45.up_proj", "model.layers.63.mlp.experts.46.up_proj", "model.layers.63.mlp.experts.47.up_proj", "model.layers.63.mlp.experts.48.up_proj", "model.layers.63.mlp.experts.49.up_proj", "model.layers.63.mlp.experts.50.up_proj", "model.layers.63.mlp.experts.51.up_proj", "model.layers.63.mlp.experts.52.up_proj", "model.layers.63.mlp.experts.53.up_proj", "model.layers.63.mlp.experts.54.up_proj", "model.layers.63.mlp.experts.55.up_proj", "model.layers.63.mlp.experts.56.up_proj", "model.layers.63.mlp.experts.57.up_proj", "model.layers.63.mlp.experts.58.up_proj", "model.layers.63.mlp.experts.59.up_proj", "model.layers.63.mlp.experts.60.up_proj", "model.layers.63.mlp.experts.61.up_proj", "model.layers.63.mlp.experts.62.up_proj", "model.layers.63.mlp.experts.63.up_proj", "model.layers.63.mlp.experts.64.up_proj", "model.layers.63.mlp.experts.65.up_proj", "model.layers.63.mlp.experts.66.up_proj", "model.layers.63.mlp.experts.67.up_proj", "model.layers.63.mlp.experts.68.up_proj", "model.layers.63.mlp.experts.69.up_proj", "model.layers.63.mlp.experts.70.up_proj", "model.layers.63.mlp.experts.71.up_proj", "model.layers.63.mlp.experts.72.up_proj", "model.layers.63.mlp.experts.73.up_proj", "model.layers.63.mlp.experts.74.up_proj", "model.layers.63.mlp.experts.75.up_proj", "model.layers.63.mlp.experts.76.up_proj", "model.layers.63.mlp.experts.77.up_proj", "model.layers.63.mlp.experts.78.up_proj", "model.layers.63.mlp.experts.79.up_proj", "model.layers.63.mlp.experts.80.up_proj", "model.layers.63.mlp.experts.81.up_proj", "model.layers.63.mlp.experts.82.up_proj", "model.layers.63.mlp.experts.83.up_proj", "model.layers.63.mlp.experts.84.up_proj", "model.layers.63.mlp.experts.85.up_proj", "model.layers.63.mlp.experts.86.up_proj", "model.layers.63.mlp.experts.87.up_proj", "model.layers.63.mlp.experts.88.up_proj", "model.layers.63.mlp.experts.89.up_proj", "model.layers.63.mlp.experts.90.up_proj", "model.layers.63.mlp.experts.91.up_proj", "model.layers.63.mlp.experts.92.up_proj", "model.layers.63.mlp.experts.93.up_proj", "model.layers.63.mlp.experts.94.up_proj", "model.layers.63.mlp.experts.95.up_proj", "model.layers.63.mlp.experts.96.up_proj", "model.layers.63.mlp.experts.97.up_proj", "model.layers.63.mlp.experts.98.up_proj", "model.layers.63.mlp.experts.99.up_proj", "model.layers.63.mlp.experts.100.up_proj", "model.layers.63.mlp.experts.101.up_proj", "model.layers.63.mlp.experts.102.up_proj", "model.layers.63.mlp.experts.103.up_proj", "model.layers.63.mlp.experts.104.up_proj", "model.layers.63.mlp.experts.105.up_proj", "model.layers.63.mlp.experts.106.up_proj", "model.layers.63.mlp.experts.107.up_proj", "model.layers.63.mlp.experts.108.up_proj", "model.layers.63.mlp.experts.109.up_proj", "model.layers.63.mlp.experts.110.up_proj", "model.layers.63.mlp.experts.111.up_proj", "model.layers.63.mlp.experts.112.up_proj", "model.layers.63.mlp.experts.113.up_proj", "model.layers.63.mlp.experts.114.up_proj", "model.layers.63.mlp.experts.115.up_proj", "model.layers.63.mlp.experts.116.up_proj", "model.layers.63.mlp.experts.117.up_proj", "model.layers.63.mlp.experts.118.up_proj", "model.layers.63.mlp.experts.119.up_proj", "model.layers.63.mlp.experts.120.up_proj", "model.layers.63.mlp.experts.121.up_proj", "model.layers.63.mlp.experts.122.up_proj", "model.layers.63.mlp.experts.123.up_proj", "model.layers.63.mlp.experts.124.up_proj", "model.layers.63.mlp.experts.125.up_proj", "model.layers.63.mlp.experts.126.up_proj", "model.layers.63.mlp.experts.127.up_proj", "model.layers.63.mlp.experts.128.up_proj", "model.layers.63.mlp.experts.129.up_proj", "model.layers.63.mlp.experts.130.up_proj", "model.layers.63.mlp.experts.131.up_proj", "model.layers.63.mlp.experts.132.up_proj", "model.layers.63.mlp.experts.133.up_proj", "model.layers.63.mlp.experts.134.up_proj", "model.layers.63.mlp.experts.135.up_proj", "model.layers.63.mlp.experts.136.up_proj", "model.layers.63.mlp.experts.137.up_proj", "model.layers.63.mlp.experts.138.up_proj", "model.layers.63.mlp.experts.139.up_proj", "model.layers.63.mlp.experts.140.up_proj", "model.layers.63.mlp.experts.141.up_proj", "model.layers.63.mlp.experts.142.up_proj", "model.layers.63.mlp.experts.143.up_proj", "model.layers.63.mlp.experts.144.up_proj", "model.layers.63.mlp.experts.145.up_proj", "model.layers.63.mlp.experts.146.up_proj", "model.layers.63.mlp.experts.147.up_proj", "model.layers.63.mlp.experts.148.up_proj", "model.layers.63.mlp.experts.149.up_proj", "model.layers.63.mlp.experts.150.up_proj", "model.layers.63.mlp.experts.151.up_proj", "model.layers.63.mlp.experts.152.up_proj", "model.layers.63.mlp.experts.153.up_proj", "model.layers.63.mlp.experts.154.up_proj", "model.layers.63.mlp.experts.155.up_proj", "model.layers.63.mlp.experts.156.up_proj", "model.layers.63.mlp.experts.157.up_proj", "model.layers.63.mlp.experts.158.up_proj", "model.layers.63.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.0766706913699232e-06, "dbits": 2516582400 }, { "dkld": -4.172697663305802e-06, "dbits": 5033164800 } ] }, { "idx": 380, "layers": [ "model.layers.63.mlp.experts.0.down_proj", "model.layers.63.mlp.experts.1.down_proj", "model.layers.63.mlp.experts.2.down_proj", "model.layers.63.mlp.experts.3.down_proj", "model.layers.63.mlp.experts.4.down_proj", "model.layers.63.mlp.experts.5.down_proj", "model.layers.63.mlp.experts.6.down_proj", "model.layers.63.mlp.experts.7.down_proj", "model.layers.63.mlp.experts.8.down_proj", "model.layers.63.mlp.experts.9.down_proj", "model.layers.63.mlp.experts.10.down_proj", "model.layers.63.mlp.experts.11.down_proj", "model.layers.63.mlp.experts.12.down_proj", "model.layers.63.mlp.experts.13.down_proj", "model.layers.63.mlp.experts.14.down_proj", "model.layers.63.mlp.experts.15.down_proj", "model.layers.63.mlp.experts.16.down_proj", "model.layers.63.mlp.experts.17.down_proj", "model.layers.63.mlp.experts.18.down_proj", "model.layers.63.mlp.experts.19.down_proj", "model.layers.63.mlp.experts.20.down_proj", "model.layers.63.mlp.experts.21.down_proj", "model.layers.63.mlp.experts.22.down_proj", "model.layers.63.mlp.experts.23.down_proj", "model.layers.63.mlp.experts.24.down_proj", "model.layers.63.mlp.experts.25.down_proj", "model.layers.63.mlp.experts.26.down_proj", "model.layers.63.mlp.experts.27.down_proj", "model.layers.63.mlp.experts.28.down_proj", "model.layers.63.mlp.experts.29.down_proj", "model.layers.63.mlp.experts.30.down_proj", "model.layers.63.mlp.experts.31.down_proj", "model.layers.63.mlp.experts.32.down_proj", "model.layers.63.mlp.experts.33.down_proj", "model.layers.63.mlp.experts.34.down_proj", "model.layers.63.mlp.experts.35.down_proj", "model.layers.63.mlp.experts.36.down_proj", "model.layers.63.mlp.experts.37.down_proj", "model.layers.63.mlp.experts.38.down_proj", "model.layers.63.mlp.experts.39.down_proj", "model.layers.63.mlp.experts.40.down_proj", "model.layers.63.mlp.experts.41.down_proj", "model.layers.63.mlp.experts.42.down_proj", "model.layers.63.mlp.experts.43.down_proj", "model.layers.63.mlp.experts.44.down_proj", "model.layers.63.mlp.experts.45.down_proj", "model.layers.63.mlp.experts.46.down_proj", "model.layers.63.mlp.experts.47.down_proj", "model.layers.63.mlp.experts.48.down_proj", "model.layers.63.mlp.experts.49.down_proj", "model.layers.63.mlp.experts.50.down_proj", "model.layers.63.mlp.experts.51.down_proj", "model.layers.63.mlp.experts.52.down_proj", "model.layers.63.mlp.experts.53.down_proj", "model.layers.63.mlp.experts.54.down_proj", "model.layers.63.mlp.experts.55.down_proj", "model.layers.63.mlp.experts.56.down_proj", "model.layers.63.mlp.experts.57.down_proj", "model.layers.63.mlp.experts.58.down_proj", "model.layers.63.mlp.experts.59.down_proj", "model.layers.63.mlp.experts.60.down_proj", "model.layers.63.mlp.experts.61.down_proj", "model.layers.63.mlp.experts.62.down_proj", "model.layers.63.mlp.experts.63.down_proj", "model.layers.63.mlp.experts.64.down_proj", "model.layers.63.mlp.experts.65.down_proj", "model.layers.63.mlp.experts.66.down_proj", "model.layers.63.mlp.experts.67.down_proj", "model.layers.63.mlp.experts.68.down_proj", "model.layers.63.mlp.experts.69.down_proj", "model.layers.63.mlp.experts.70.down_proj", "model.layers.63.mlp.experts.71.down_proj", "model.layers.63.mlp.experts.72.down_proj", "model.layers.63.mlp.experts.73.down_proj", "model.layers.63.mlp.experts.74.down_proj", "model.layers.63.mlp.experts.75.down_proj", "model.layers.63.mlp.experts.76.down_proj", "model.layers.63.mlp.experts.77.down_proj", "model.layers.63.mlp.experts.78.down_proj", "model.layers.63.mlp.experts.79.down_proj", "model.layers.63.mlp.experts.80.down_proj", "model.layers.63.mlp.experts.81.down_proj", "model.layers.63.mlp.experts.82.down_proj", "model.layers.63.mlp.experts.83.down_proj", "model.layers.63.mlp.experts.84.down_proj", "model.layers.63.mlp.experts.85.down_proj", "model.layers.63.mlp.experts.86.down_proj", "model.layers.63.mlp.experts.87.down_proj", "model.layers.63.mlp.experts.88.down_proj", "model.layers.63.mlp.experts.89.down_proj", "model.layers.63.mlp.experts.90.down_proj", "model.layers.63.mlp.experts.91.down_proj", "model.layers.63.mlp.experts.92.down_proj", "model.layers.63.mlp.experts.93.down_proj", "model.layers.63.mlp.experts.94.down_proj", "model.layers.63.mlp.experts.95.down_proj", "model.layers.63.mlp.experts.96.down_proj", "model.layers.63.mlp.experts.97.down_proj", "model.layers.63.mlp.experts.98.down_proj", "model.layers.63.mlp.experts.99.down_proj", "model.layers.63.mlp.experts.100.down_proj", "model.layers.63.mlp.experts.101.down_proj", "model.layers.63.mlp.experts.102.down_proj", "model.layers.63.mlp.experts.103.down_proj", "model.layers.63.mlp.experts.104.down_proj", "model.layers.63.mlp.experts.105.down_proj", "model.layers.63.mlp.experts.106.down_proj", "model.layers.63.mlp.experts.107.down_proj", "model.layers.63.mlp.experts.108.down_proj", "model.layers.63.mlp.experts.109.down_proj", "model.layers.63.mlp.experts.110.down_proj", "model.layers.63.mlp.experts.111.down_proj", "model.layers.63.mlp.experts.112.down_proj", "model.layers.63.mlp.experts.113.down_proj", "model.layers.63.mlp.experts.114.down_proj", "model.layers.63.mlp.experts.115.down_proj", "model.layers.63.mlp.experts.116.down_proj", "model.layers.63.mlp.experts.117.down_proj", "model.layers.63.mlp.experts.118.down_proj", "model.layers.63.mlp.experts.119.down_proj", "model.layers.63.mlp.experts.120.down_proj", "model.layers.63.mlp.experts.121.down_proj", "model.layers.63.mlp.experts.122.down_proj", "model.layers.63.mlp.experts.123.down_proj", "model.layers.63.mlp.experts.124.down_proj", "model.layers.63.mlp.experts.125.down_proj", "model.layers.63.mlp.experts.126.down_proj", "model.layers.63.mlp.experts.127.down_proj", "model.layers.63.mlp.experts.128.down_proj", "model.layers.63.mlp.experts.129.down_proj", "model.layers.63.mlp.experts.130.down_proj", "model.layers.63.mlp.experts.131.down_proj", "model.layers.63.mlp.experts.132.down_proj", "model.layers.63.mlp.experts.133.down_proj", "model.layers.63.mlp.experts.134.down_proj", "model.layers.63.mlp.experts.135.down_proj", "model.layers.63.mlp.experts.136.down_proj", "model.layers.63.mlp.experts.137.down_proj", "model.layers.63.mlp.experts.138.down_proj", "model.layers.63.mlp.experts.139.down_proj", "model.layers.63.mlp.experts.140.down_proj", "model.layers.63.mlp.experts.141.down_proj", "model.layers.63.mlp.experts.142.down_proj", "model.layers.63.mlp.experts.143.down_proj", "model.layers.63.mlp.experts.144.down_proj", "model.layers.63.mlp.experts.145.down_proj", "model.layers.63.mlp.experts.146.down_proj", "model.layers.63.mlp.experts.147.down_proj", "model.layers.63.mlp.experts.148.down_proj", "model.layers.63.mlp.experts.149.down_proj", "model.layers.63.mlp.experts.150.down_proj", "model.layers.63.mlp.experts.151.down_proj", "model.layers.63.mlp.experts.152.down_proj", "model.layers.63.mlp.experts.153.down_proj", "model.layers.63.mlp.experts.154.down_proj", "model.layers.63.mlp.experts.155.down_proj", "model.layers.63.mlp.experts.156.down_proj", "model.layers.63.mlp.experts.157.down_proj", "model.layers.63.mlp.experts.158.down_proj", "model.layers.63.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 1.7341063357890693e-05, "dbits": 1258291200 }, { "dkld": 2.4941610172392326e-05, "dbits": 2516582400 } ] }, { "idx": 381, "layers": [ "model.layers.64.self_attn.q_proj" ], "candidates": [ { "dkld": 1.897863112390076e-05, "dbits": 62914560 }, { "dkld": 8.069071918727355e-06, "dbits": 125829120 } ] }, { "idx": 382, "layers": [ "model.layers.64.self_attn.k_proj", "model.layers.64.self_attn.v_proj" ], "candidates": [ { "dkld": 1.4786329120398609e-05, "dbits": 10485760 }, { "dkld": 1.4506746083498001e-05, "dbits": 20971520 } ] }, { "idx": 383, "layers": [ "model.layers.64.self_attn.o_proj" ], "candidates": [ { "dkld": 7.700920104981163e-06, "dbits": 62914560 }, { "dkld": 4.500057548284878e-06, "dbits": 125829120 } ] }, { "idx": 384, "layers": [ "model.layers.64.mlp.shared_experts.gate_proj", "model.layers.64.mlp.shared_experts.up_proj", "model.layers.64.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.474772140380251e-07, "dbits": 23592960 }, { "dkld": -1.3676518574355992e-05, "dbits": 47185920 } ] }, { "idx": 385, "layers": [ "model.layers.64.mlp.experts.0.gate_proj", "model.layers.64.mlp.experts.1.gate_proj", "model.layers.64.mlp.experts.2.gate_proj", "model.layers.64.mlp.experts.3.gate_proj", "model.layers.64.mlp.experts.4.gate_proj", "model.layers.64.mlp.experts.5.gate_proj", "model.layers.64.mlp.experts.6.gate_proj", "model.layers.64.mlp.experts.7.gate_proj", "model.layers.64.mlp.experts.8.gate_proj", "model.layers.64.mlp.experts.9.gate_proj", "model.layers.64.mlp.experts.10.gate_proj", "model.layers.64.mlp.experts.11.gate_proj", "model.layers.64.mlp.experts.12.gate_proj", "model.layers.64.mlp.experts.13.gate_proj", "model.layers.64.mlp.experts.14.gate_proj", "model.layers.64.mlp.experts.15.gate_proj", "model.layers.64.mlp.experts.16.gate_proj", "model.layers.64.mlp.experts.17.gate_proj", "model.layers.64.mlp.experts.18.gate_proj", "model.layers.64.mlp.experts.19.gate_proj", "model.layers.64.mlp.experts.20.gate_proj", "model.layers.64.mlp.experts.21.gate_proj", "model.layers.64.mlp.experts.22.gate_proj", "model.layers.64.mlp.experts.23.gate_proj", "model.layers.64.mlp.experts.24.gate_proj", "model.layers.64.mlp.experts.25.gate_proj", "model.layers.64.mlp.experts.26.gate_proj", "model.layers.64.mlp.experts.27.gate_proj", "model.layers.64.mlp.experts.28.gate_proj", "model.layers.64.mlp.experts.29.gate_proj", "model.layers.64.mlp.experts.30.gate_proj", "model.layers.64.mlp.experts.31.gate_proj", "model.layers.64.mlp.experts.32.gate_proj", "model.layers.64.mlp.experts.33.gate_proj", "model.layers.64.mlp.experts.34.gate_proj", "model.layers.64.mlp.experts.35.gate_proj", "model.layers.64.mlp.experts.36.gate_proj", "model.layers.64.mlp.experts.37.gate_proj", "model.layers.64.mlp.experts.38.gate_proj", "model.layers.64.mlp.experts.39.gate_proj", "model.layers.64.mlp.experts.40.gate_proj", "model.layers.64.mlp.experts.41.gate_proj", "model.layers.64.mlp.experts.42.gate_proj", "model.layers.64.mlp.experts.43.gate_proj", "model.layers.64.mlp.experts.44.gate_proj", "model.layers.64.mlp.experts.45.gate_proj", "model.layers.64.mlp.experts.46.gate_proj", "model.layers.64.mlp.experts.47.gate_proj", "model.layers.64.mlp.experts.48.gate_proj", "model.layers.64.mlp.experts.49.gate_proj", "model.layers.64.mlp.experts.50.gate_proj", "model.layers.64.mlp.experts.51.gate_proj", "model.layers.64.mlp.experts.52.gate_proj", "model.layers.64.mlp.experts.53.gate_proj", "model.layers.64.mlp.experts.54.gate_proj", "model.layers.64.mlp.experts.55.gate_proj", "model.layers.64.mlp.experts.56.gate_proj", "model.layers.64.mlp.experts.57.gate_proj", "model.layers.64.mlp.experts.58.gate_proj", "model.layers.64.mlp.experts.59.gate_proj", "model.layers.64.mlp.experts.60.gate_proj", "model.layers.64.mlp.experts.61.gate_proj", "model.layers.64.mlp.experts.62.gate_proj", "model.layers.64.mlp.experts.63.gate_proj", "model.layers.64.mlp.experts.64.gate_proj", "model.layers.64.mlp.experts.65.gate_proj", "model.layers.64.mlp.experts.66.gate_proj", "model.layers.64.mlp.experts.67.gate_proj", "model.layers.64.mlp.experts.68.gate_proj", "model.layers.64.mlp.experts.69.gate_proj", "model.layers.64.mlp.experts.70.gate_proj", "model.layers.64.mlp.experts.71.gate_proj", "model.layers.64.mlp.experts.72.gate_proj", "model.layers.64.mlp.experts.73.gate_proj", "model.layers.64.mlp.experts.74.gate_proj", "model.layers.64.mlp.experts.75.gate_proj", "model.layers.64.mlp.experts.76.gate_proj", "model.layers.64.mlp.experts.77.gate_proj", "model.layers.64.mlp.experts.78.gate_proj", "model.layers.64.mlp.experts.79.gate_proj", "model.layers.64.mlp.experts.80.gate_proj", "model.layers.64.mlp.experts.81.gate_proj", "model.layers.64.mlp.experts.82.gate_proj", "model.layers.64.mlp.experts.83.gate_proj", "model.layers.64.mlp.experts.84.gate_proj", "model.layers.64.mlp.experts.85.gate_proj", "model.layers.64.mlp.experts.86.gate_proj", "model.layers.64.mlp.experts.87.gate_proj", "model.layers.64.mlp.experts.88.gate_proj", "model.layers.64.mlp.experts.89.gate_proj", "model.layers.64.mlp.experts.90.gate_proj", "model.layers.64.mlp.experts.91.gate_proj", "model.layers.64.mlp.experts.92.gate_proj", "model.layers.64.mlp.experts.93.gate_proj", "model.layers.64.mlp.experts.94.gate_proj", "model.layers.64.mlp.experts.95.gate_proj", "model.layers.64.mlp.experts.96.gate_proj", "model.layers.64.mlp.experts.97.gate_proj", "model.layers.64.mlp.experts.98.gate_proj", "model.layers.64.mlp.experts.99.gate_proj", "model.layers.64.mlp.experts.100.gate_proj", "model.layers.64.mlp.experts.101.gate_proj", "model.layers.64.mlp.experts.102.gate_proj", "model.layers.64.mlp.experts.103.gate_proj", "model.layers.64.mlp.experts.104.gate_proj", "model.layers.64.mlp.experts.105.gate_proj", "model.layers.64.mlp.experts.106.gate_proj", "model.layers.64.mlp.experts.107.gate_proj", "model.layers.64.mlp.experts.108.gate_proj", "model.layers.64.mlp.experts.109.gate_proj", "model.layers.64.mlp.experts.110.gate_proj", "model.layers.64.mlp.experts.111.gate_proj", "model.layers.64.mlp.experts.112.gate_proj", "model.layers.64.mlp.experts.113.gate_proj", "model.layers.64.mlp.experts.114.gate_proj", "model.layers.64.mlp.experts.115.gate_proj", "model.layers.64.mlp.experts.116.gate_proj", "model.layers.64.mlp.experts.117.gate_proj", "model.layers.64.mlp.experts.118.gate_proj", "model.layers.64.mlp.experts.119.gate_proj", "model.layers.64.mlp.experts.120.gate_proj", "model.layers.64.mlp.experts.121.gate_proj", "model.layers.64.mlp.experts.122.gate_proj", "model.layers.64.mlp.experts.123.gate_proj", "model.layers.64.mlp.experts.124.gate_proj", "model.layers.64.mlp.experts.125.gate_proj", "model.layers.64.mlp.experts.126.gate_proj", "model.layers.64.mlp.experts.127.gate_proj", "model.layers.64.mlp.experts.128.gate_proj", "model.layers.64.mlp.experts.129.gate_proj", "model.layers.64.mlp.experts.130.gate_proj", "model.layers.64.mlp.experts.131.gate_proj", "model.layers.64.mlp.experts.132.gate_proj", "model.layers.64.mlp.experts.133.gate_proj", "model.layers.64.mlp.experts.134.gate_proj", "model.layers.64.mlp.experts.135.gate_proj", "model.layers.64.mlp.experts.136.gate_proj", "model.layers.64.mlp.experts.137.gate_proj", "model.layers.64.mlp.experts.138.gate_proj", "model.layers.64.mlp.experts.139.gate_proj", "model.layers.64.mlp.experts.140.gate_proj", "model.layers.64.mlp.experts.141.gate_proj", "model.layers.64.mlp.experts.142.gate_proj", "model.layers.64.mlp.experts.143.gate_proj", "model.layers.64.mlp.experts.144.gate_proj", "model.layers.64.mlp.experts.145.gate_proj", "model.layers.64.mlp.experts.146.gate_proj", "model.layers.64.mlp.experts.147.gate_proj", "model.layers.64.mlp.experts.148.gate_proj", "model.layers.64.mlp.experts.149.gate_proj", "model.layers.64.mlp.experts.150.gate_proj", "model.layers.64.mlp.experts.151.gate_proj", "model.layers.64.mlp.experts.152.gate_proj", "model.layers.64.mlp.experts.153.gate_proj", "model.layers.64.mlp.experts.154.gate_proj", "model.layers.64.mlp.experts.155.gate_proj", "model.layers.64.mlp.experts.156.gate_proj", "model.layers.64.mlp.experts.157.gate_proj", "model.layers.64.mlp.experts.158.gate_proj", "model.layers.64.mlp.experts.159.gate_proj", "model.layers.64.mlp.experts.0.up_proj", "model.layers.64.mlp.experts.1.up_proj", "model.layers.64.mlp.experts.2.up_proj", "model.layers.64.mlp.experts.3.up_proj", "model.layers.64.mlp.experts.4.up_proj", "model.layers.64.mlp.experts.5.up_proj", "model.layers.64.mlp.experts.6.up_proj", "model.layers.64.mlp.experts.7.up_proj", "model.layers.64.mlp.experts.8.up_proj", "model.layers.64.mlp.experts.9.up_proj", "model.layers.64.mlp.experts.10.up_proj", "model.layers.64.mlp.experts.11.up_proj", "model.layers.64.mlp.experts.12.up_proj", "model.layers.64.mlp.experts.13.up_proj", "model.layers.64.mlp.experts.14.up_proj", "model.layers.64.mlp.experts.15.up_proj", "model.layers.64.mlp.experts.16.up_proj", "model.layers.64.mlp.experts.17.up_proj", "model.layers.64.mlp.experts.18.up_proj", "model.layers.64.mlp.experts.19.up_proj", "model.layers.64.mlp.experts.20.up_proj", "model.layers.64.mlp.experts.21.up_proj", "model.layers.64.mlp.experts.22.up_proj", "model.layers.64.mlp.experts.23.up_proj", "model.layers.64.mlp.experts.24.up_proj", "model.layers.64.mlp.experts.25.up_proj", "model.layers.64.mlp.experts.26.up_proj", "model.layers.64.mlp.experts.27.up_proj", "model.layers.64.mlp.experts.28.up_proj", "model.layers.64.mlp.experts.29.up_proj", "model.layers.64.mlp.experts.30.up_proj", "model.layers.64.mlp.experts.31.up_proj", "model.layers.64.mlp.experts.32.up_proj", "model.layers.64.mlp.experts.33.up_proj", "model.layers.64.mlp.experts.34.up_proj", "model.layers.64.mlp.experts.35.up_proj", "model.layers.64.mlp.experts.36.up_proj", "model.layers.64.mlp.experts.37.up_proj", "model.layers.64.mlp.experts.38.up_proj", "model.layers.64.mlp.experts.39.up_proj", "model.layers.64.mlp.experts.40.up_proj", "model.layers.64.mlp.experts.41.up_proj", "model.layers.64.mlp.experts.42.up_proj", "model.layers.64.mlp.experts.43.up_proj", "model.layers.64.mlp.experts.44.up_proj", "model.layers.64.mlp.experts.45.up_proj", "model.layers.64.mlp.experts.46.up_proj", "model.layers.64.mlp.experts.47.up_proj", "model.layers.64.mlp.experts.48.up_proj", "model.layers.64.mlp.experts.49.up_proj", "model.layers.64.mlp.experts.50.up_proj", "model.layers.64.mlp.experts.51.up_proj", "model.layers.64.mlp.experts.52.up_proj", "model.layers.64.mlp.experts.53.up_proj", "model.layers.64.mlp.experts.54.up_proj", "model.layers.64.mlp.experts.55.up_proj", "model.layers.64.mlp.experts.56.up_proj", "model.layers.64.mlp.experts.57.up_proj", "model.layers.64.mlp.experts.58.up_proj", "model.layers.64.mlp.experts.59.up_proj", "model.layers.64.mlp.experts.60.up_proj", "model.layers.64.mlp.experts.61.up_proj", "model.layers.64.mlp.experts.62.up_proj", "model.layers.64.mlp.experts.63.up_proj", "model.layers.64.mlp.experts.64.up_proj", "model.layers.64.mlp.experts.65.up_proj", "model.layers.64.mlp.experts.66.up_proj", "model.layers.64.mlp.experts.67.up_proj", "model.layers.64.mlp.experts.68.up_proj", "model.layers.64.mlp.experts.69.up_proj", "model.layers.64.mlp.experts.70.up_proj", "model.layers.64.mlp.experts.71.up_proj", "model.layers.64.mlp.experts.72.up_proj", "model.layers.64.mlp.experts.73.up_proj", "model.layers.64.mlp.experts.74.up_proj", "model.layers.64.mlp.experts.75.up_proj", "model.layers.64.mlp.experts.76.up_proj", "model.layers.64.mlp.experts.77.up_proj", "model.layers.64.mlp.experts.78.up_proj", "model.layers.64.mlp.experts.79.up_proj", "model.layers.64.mlp.experts.80.up_proj", "model.layers.64.mlp.experts.81.up_proj", "model.layers.64.mlp.experts.82.up_proj", "model.layers.64.mlp.experts.83.up_proj", "model.layers.64.mlp.experts.84.up_proj", "model.layers.64.mlp.experts.85.up_proj", "model.layers.64.mlp.experts.86.up_proj", "model.layers.64.mlp.experts.87.up_proj", "model.layers.64.mlp.experts.88.up_proj", "model.layers.64.mlp.experts.89.up_proj", "model.layers.64.mlp.experts.90.up_proj", "model.layers.64.mlp.experts.91.up_proj", "model.layers.64.mlp.experts.92.up_proj", "model.layers.64.mlp.experts.93.up_proj", "model.layers.64.mlp.experts.94.up_proj", "model.layers.64.mlp.experts.95.up_proj", "model.layers.64.mlp.experts.96.up_proj", "model.layers.64.mlp.experts.97.up_proj", "model.layers.64.mlp.experts.98.up_proj", "model.layers.64.mlp.experts.99.up_proj", "model.layers.64.mlp.experts.100.up_proj", "model.layers.64.mlp.experts.101.up_proj", "model.layers.64.mlp.experts.102.up_proj", "model.layers.64.mlp.experts.103.up_proj", "model.layers.64.mlp.experts.104.up_proj", "model.layers.64.mlp.experts.105.up_proj", "model.layers.64.mlp.experts.106.up_proj", "model.layers.64.mlp.experts.107.up_proj", "model.layers.64.mlp.experts.108.up_proj", "model.layers.64.mlp.experts.109.up_proj", "model.layers.64.mlp.experts.110.up_proj", "model.layers.64.mlp.experts.111.up_proj", "model.layers.64.mlp.experts.112.up_proj", "model.layers.64.mlp.experts.113.up_proj", "model.layers.64.mlp.experts.114.up_proj", "model.layers.64.mlp.experts.115.up_proj", "model.layers.64.mlp.experts.116.up_proj", "model.layers.64.mlp.experts.117.up_proj", "model.layers.64.mlp.experts.118.up_proj", "model.layers.64.mlp.experts.119.up_proj", "model.layers.64.mlp.experts.120.up_proj", "model.layers.64.mlp.experts.121.up_proj", "model.layers.64.mlp.experts.122.up_proj", "model.layers.64.mlp.experts.123.up_proj", "model.layers.64.mlp.experts.124.up_proj", "model.layers.64.mlp.experts.125.up_proj", "model.layers.64.mlp.experts.126.up_proj", "model.layers.64.mlp.experts.127.up_proj", "model.layers.64.mlp.experts.128.up_proj", "model.layers.64.mlp.experts.129.up_proj", "model.layers.64.mlp.experts.130.up_proj", "model.layers.64.mlp.experts.131.up_proj", "model.layers.64.mlp.experts.132.up_proj", "model.layers.64.mlp.experts.133.up_proj", "model.layers.64.mlp.experts.134.up_proj", "model.layers.64.mlp.experts.135.up_proj", "model.layers.64.mlp.experts.136.up_proj", "model.layers.64.mlp.experts.137.up_proj", "model.layers.64.mlp.experts.138.up_proj", "model.layers.64.mlp.experts.139.up_proj", "model.layers.64.mlp.experts.140.up_proj", "model.layers.64.mlp.experts.141.up_proj", "model.layers.64.mlp.experts.142.up_proj", "model.layers.64.mlp.experts.143.up_proj", "model.layers.64.mlp.experts.144.up_proj", "model.layers.64.mlp.experts.145.up_proj", "model.layers.64.mlp.experts.146.up_proj", "model.layers.64.mlp.experts.147.up_proj", "model.layers.64.mlp.experts.148.up_proj", "model.layers.64.mlp.experts.149.up_proj", "model.layers.64.mlp.experts.150.up_proj", "model.layers.64.mlp.experts.151.up_proj", "model.layers.64.mlp.experts.152.up_proj", "model.layers.64.mlp.experts.153.up_proj", "model.layers.64.mlp.experts.154.up_proj", "model.layers.64.mlp.experts.155.up_proj", "model.layers.64.mlp.experts.156.up_proj", "model.layers.64.mlp.experts.157.up_proj", "model.layers.64.mlp.experts.158.up_proj", "model.layers.64.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.1927600502967834e-05, "dbits": 2516582400 }, { "dkld": -2.4887104518710873e-05, "dbits": 5033164800 } ] }, { "idx": 386, "layers": [ "model.layers.64.mlp.experts.0.down_proj", "model.layers.64.mlp.experts.1.down_proj", "model.layers.64.mlp.experts.2.down_proj", "model.layers.64.mlp.experts.3.down_proj", "model.layers.64.mlp.experts.4.down_proj", "model.layers.64.mlp.experts.5.down_proj", "model.layers.64.mlp.experts.6.down_proj", "model.layers.64.mlp.experts.7.down_proj", "model.layers.64.mlp.experts.8.down_proj", "model.layers.64.mlp.experts.9.down_proj", "model.layers.64.mlp.experts.10.down_proj", "model.layers.64.mlp.experts.11.down_proj", "model.layers.64.mlp.experts.12.down_proj", "model.layers.64.mlp.experts.13.down_proj", "model.layers.64.mlp.experts.14.down_proj", "model.layers.64.mlp.experts.15.down_proj", "model.layers.64.mlp.experts.16.down_proj", "model.layers.64.mlp.experts.17.down_proj", "model.layers.64.mlp.experts.18.down_proj", "model.layers.64.mlp.experts.19.down_proj", "model.layers.64.mlp.experts.20.down_proj", "model.layers.64.mlp.experts.21.down_proj", "model.layers.64.mlp.experts.22.down_proj", "model.layers.64.mlp.experts.23.down_proj", "model.layers.64.mlp.experts.24.down_proj", "model.layers.64.mlp.experts.25.down_proj", "model.layers.64.mlp.experts.26.down_proj", "model.layers.64.mlp.experts.27.down_proj", "model.layers.64.mlp.experts.28.down_proj", "model.layers.64.mlp.experts.29.down_proj", "model.layers.64.mlp.experts.30.down_proj", "model.layers.64.mlp.experts.31.down_proj", "model.layers.64.mlp.experts.32.down_proj", "model.layers.64.mlp.experts.33.down_proj", "model.layers.64.mlp.experts.34.down_proj", "model.layers.64.mlp.experts.35.down_proj", "model.layers.64.mlp.experts.36.down_proj", "model.layers.64.mlp.experts.37.down_proj", "model.layers.64.mlp.experts.38.down_proj", "model.layers.64.mlp.experts.39.down_proj", "model.layers.64.mlp.experts.40.down_proj", "model.layers.64.mlp.experts.41.down_proj", "model.layers.64.mlp.experts.42.down_proj", "model.layers.64.mlp.experts.43.down_proj", "model.layers.64.mlp.experts.44.down_proj", "model.layers.64.mlp.experts.45.down_proj", "model.layers.64.mlp.experts.46.down_proj", "model.layers.64.mlp.experts.47.down_proj", "model.layers.64.mlp.experts.48.down_proj", "model.layers.64.mlp.experts.49.down_proj", "model.layers.64.mlp.experts.50.down_proj", "model.layers.64.mlp.experts.51.down_proj", "model.layers.64.mlp.experts.52.down_proj", "model.layers.64.mlp.experts.53.down_proj", "model.layers.64.mlp.experts.54.down_proj", "model.layers.64.mlp.experts.55.down_proj", "model.layers.64.mlp.experts.56.down_proj", "model.layers.64.mlp.experts.57.down_proj", "model.layers.64.mlp.experts.58.down_proj", "model.layers.64.mlp.experts.59.down_proj", "model.layers.64.mlp.experts.60.down_proj", "model.layers.64.mlp.experts.61.down_proj", "model.layers.64.mlp.experts.62.down_proj", "model.layers.64.mlp.experts.63.down_proj", "model.layers.64.mlp.experts.64.down_proj", "model.layers.64.mlp.experts.65.down_proj", "model.layers.64.mlp.experts.66.down_proj", "model.layers.64.mlp.experts.67.down_proj", "model.layers.64.mlp.experts.68.down_proj", "model.layers.64.mlp.experts.69.down_proj", "model.layers.64.mlp.experts.70.down_proj", "model.layers.64.mlp.experts.71.down_proj", "model.layers.64.mlp.experts.72.down_proj", "model.layers.64.mlp.experts.73.down_proj", "model.layers.64.mlp.experts.74.down_proj", "model.layers.64.mlp.experts.75.down_proj", "model.layers.64.mlp.experts.76.down_proj", "model.layers.64.mlp.experts.77.down_proj", "model.layers.64.mlp.experts.78.down_proj", "model.layers.64.mlp.experts.79.down_proj", "model.layers.64.mlp.experts.80.down_proj", "model.layers.64.mlp.experts.81.down_proj", "model.layers.64.mlp.experts.82.down_proj", "model.layers.64.mlp.experts.83.down_proj", "model.layers.64.mlp.experts.84.down_proj", "model.layers.64.mlp.experts.85.down_proj", "model.layers.64.mlp.experts.86.down_proj", "model.layers.64.mlp.experts.87.down_proj", "model.layers.64.mlp.experts.88.down_proj", "model.layers.64.mlp.experts.89.down_proj", "model.layers.64.mlp.experts.90.down_proj", "model.layers.64.mlp.experts.91.down_proj", "model.layers.64.mlp.experts.92.down_proj", "model.layers.64.mlp.experts.93.down_proj", "model.layers.64.mlp.experts.94.down_proj", "model.layers.64.mlp.experts.95.down_proj", "model.layers.64.mlp.experts.96.down_proj", "model.layers.64.mlp.experts.97.down_proj", "model.layers.64.mlp.experts.98.down_proj", "model.layers.64.mlp.experts.99.down_proj", "model.layers.64.mlp.experts.100.down_proj", "model.layers.64.mlp.experts.101.down_proj", "model.layers.64.mlp.experts.102.down_proj", "model.layers.64.mlp.experts.103.down_proj", "model.layers.64.mlp.experts.104.down_proj", "model.layers.64.mlp.experts.105.down_proj", "model.layers.64.mlp.experts.106.down_proj", "model.layers.64.mlp.experts.107.down_proj", "model.layers.64.mlp.experts.108.down_proj", "model.layers.64.mlp.experts.109.down_proj", "model.layers.64.mlp.experts.110.down_proj", "model.layers.64.mlp.experts.111.down_proj", "model.layers.64.mlp.experts.112.down_proj", "model.layers.64.mlp.experts.113.down_proj", "model.layers.64.mlp.experts.114.down_proj", "model.layers.64.mlp.experts.115.down_proj", "model.layers.64.mlp.experts.116.down_proj", "model.layers.64.mlp.experts.117.down_proj", "model.layers.64.mlp.experts.118.down_proj", "model.layers.64.mlp.experts.119.down_proj", "model.layers.64.mlp.experts.120.down_proj", "model.layers.64.mlp.experts.121.down_proj", "model.layers.64.mlp.experts.122.down_proj", "model.layers.64.mlp.experts.123.down_proj", "model.layers.64.mlp.experts.124.down_proj", "model.layers.64.mlp.experts.125.down_proj", "model.layers.64.mlp.experts.126.down_proj", "model.layers.64.mlp.experts.127.down_proj", "model.layers.64.mlp.experts.128.down_proj", "model.layers.64.mlp.experts.129.down_proj", "model.layers.64.mlp.experts.130.down_proj", "model.layers.64.mlp.experts.131.down_proj", "model.layers.64.mlp.experts.132.down_proj", "model.layers.64.mlp.experts.133.down_proj", "model.layers.64.mlp.experts.134.down_proj", "model.layers.64.mlp.experts.135.down_proj", "model.layers.64.mlp.experts.136.down_proj", "model.layers.64.mlp.experts.137.down_proj", "model.layers.64.mlp.experts.138.down_proj", "model.layers.64.mlp.experts.139.down_proj", "model.layers.64.mlp.experts.140.down_proj", "model.layers.64.mlp.experts.141.down_proj", "model.layers.64.mlp.experts.142.down_proj", "model.layers.64.mlp.experts.143.down_proj", "model.layers.64.mlp.experts.144.down_proj", "model.layers.64.mlp.experts.145.down_proj", "model.layers.64.mlp.experts.146.down_proj", "model.layers.64.mlp.experts.147.down_proj", "model.layers.64.mlp.experts.148.down_proj", "model.layers.64.mlp.experts.149.down_proj", "model.layers.64.mlp.experts.150.down_proj", "model.layers.64.mlp.experts.151.down_proj", "model.layers.64.mlp.experts.152.down_proj", "model.layers.64.mlp.experts.153.down_proj", "model.layers.64.mlp.experts.154.down_proj", "model.layers.64.mlp.experts.155.down_proj", "model.layers.64.mlp.experts.156.down_proj", "model.layers.64.mlp.experts.157.down_proj", "model.layers.64.mlp.experts.158.down_proj", "model.layers.64.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -7.747206836938858e-06, "dbits": 1258291200 }, { "dkld": -2.7587637305252766e-06, "dbits": 2516582400 } ] }, { "idx": 387, "layers": [ "model.layers.65.self_attn.q_proj" ], "candidates": [ { "dkld": 2.458142116665979e-05, "dbits": 62914560 }, { "dkld": 2.0116334781050682e-05, "dbits": 125829120 } ] }, { "idx": 388, "layers": [ "model.layers.65.self_attn.k_proj", "model.layers.65.self_attn.v_proj" ], "candidates": [ { "dkld": -4.698205739259685e-05, "dbits": 10485760 }, { "dkld": -1.9579101353882356e-05, "dbits": 20971520 } ] }, { "idx": 389, "layers": [ "model.layers.65.self_attn.o_proj" ], "candidates": [ { "dkld": -1.2529036030172608e-05, "dbits": 62914560 }, { "dkld": -8.438690565526138e-06, "dbits": 125829120 } ] }, { "idx": 390, "layers": [ "model.layers.65.mlp.shared_experts.gate_proj", "model.layers.65.mlp.shared_experts.up_proj", "model.layers.65.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 7.737427949905396e-06, "dbits": 23592960 }, { "dkld": -6.271689198910149e-06, "dbits": 47185920 } ] }, { "idx": 391, "layers": [ "model.layers.65.mlp.experts.0.gate_proj", "model.layers.65.mlp.experts.1.gate_proj", "model.layers.65.mlp.experts.2.gate_proj", "model.layers.65.mlp.experts.3.gate_proj", "model.layers.65.mlp.experts.4.gate_proj", "model.layers.65.mlp.experts.5.gate_proj", "model.layers.65.mlp.experts.6.gate_proj", "model.layers.65.mlp.experts.7.gate_proj", "model.layers.65.mlp.experts.8.gate_proj", "model.layers.65.mlp.experts.9.gate_proj", "model.layers.65.mlp.experts.10.gate_proj", "model.layers.65.mlp.experts.11.gate_proj", "model.layers.65.mlp.experts.12.gate_proj", "model.layers.65.mlp.experts.13.gate_proj", "model.layers.65.mlp.experts.14.gate_proj", "model.layers.65.mlp.experts.15.gate_proj", "model.layers.65.mlp.experts.16.gate_proj", "model.layers.65.mlp.experts.17.gate_proj", "model.layers.65.mlp.experts.18.gate_proj", "model.layers.65.mlp.experts.19.gate_proj", "model.layers.65.mlp.experts.20.gate_proj", "model.layers.65.mlp.experts.21.gate_proj", "model.layers.65.mlp.experts.22.gate_proj", "model.layers.65.mlp.experts.23.gate_proj", "model.layers.65.mlp.experts.24.gate_proj", "model.layers.65.mlp.experts.25.gate_proj", "model.layers.65.mlp.experts.26.gate_proj", "model.layers.65.mlp.experts.27.gate_proj", "model.layers.65.mlp.experts.28.gate_proj", "model.layers.65.mlp.experts.29.gate_proj", "model.layers.65.mlp.experts.30.gate_proj", "model.layers.65.mlp.experts.31.gate_proj", "model.layers.65.mlp.experts.32.gate_proj", "model.layers.65.mlp.experts.33.gate_proj", "model.layers.65.mlp.experts.34.gate_proj", "model.layers.65.mlp.experts.35.gate_proj", "model.layers.65.mlp.experts.36.gate_proj", "model.layers.65.mlp.experts.37.gate_proj", "model.layers.65.mlp.experts.38.gate_proj", "model.layers.65.mlp.experts.39.gate_proj", "model.layers.65.mlp.experts.40.gate_proj", "model.layers.65.mlp.experts.41.gate_proj", "model.layers.65.mlp.experts.42.gate_proj", "model.layers.65.mlp.experts.43.gate_proj", "model.layers.65.mlp.experts.44.gate_proj", "model.layers.65.mlp.experts.45.gate_proj", "model.layers.65.mlp.experts.46.gate_proj", "model.layers.65.mlp.experts.47.gate_proj", "model.layers.65.mlp.experts.48.gate_proj", "model.layers.65.mlp.experts.49.gate_proj", "model.layers.65.mlp.experts.50.gate_proj", "model.layers.65.mlp.experts.51.gate_proj", "model.layers.65.mlp.experts.52.gate_proj", "model.layers.65.mlp.experts.53.gate_proj", "model.layers.65.mlp.experts.54.gate_proj", "model.layers.65.mlp.experts.55.gate_proj", "model.layers.65.mlp.experts.56.gate_proj", "model.layers.65.mlp.experts.57.gate_proj", "model.layers.65.mlp.experts.58.gate_proj", "model.layers.65.mlp.experts.59.gate_proj", "model.layers.65.mlp.experts.60.gate_proj", "model.layers.65.mlp.experts.61.gate_proj", "model.layers.65.mlp.experts.62.gate_proj", "model.layers.65.mlp.experts.63.gate_proj", "model.layers.65.mlp.experts.64.gate_proj", "model.layers.65.mlp.experts.65.gate_proj", "model.layers.65.mlp.experts.66.gate_proj", "model.layers.65.mlp.experts.67.gate_proj", "model.layers.65.mlp.experts.68.gate_proj", "model.layers.65.mlp.experts.69.gate_proj", "model.layers.65.mlp.experts.70.gate_proj", "model.layers.65.mlp.experts.71.gate_proj", "model.layers.65.mlp.experts.72.gate_proj", "model.layers.65.mlp.experts.73.gate_proj", "model.layers.65.mlp.experts.74.gate_proj", "model.layers.65.mlp.experts.75.gate_proj", "model.layers.65.mlp.experts.76.gate_proj", "model.layers.65.mlp.experts.77.gate_proj", "model.layers.65.mlp.experts.78.gate_proj", "model.layers.65.mlp.experts.79.gate_proj", "model.layers.65.mlp.experts.80.gate_proj", "model.layers.65.mlp.experts.81.gate_proj", "model.layers.65.mlp.experts.82.gate_proj", "model.layers.65.mlp.experts.83.gate_proj", "model.layers.65.mlp.experts.84.gate_proj", "model.layers.65.mlp.experts.85.gate_proj", "model.layers.65.mlp.experts.86.gate_proj", "model.layers.65.mlp.experts.87.gate_proj", "model.layers.65.mlp.experts.88.gate_proj", "model.layers.65.mlp.experts.89.gate_proj", "model.layers.65.mlp.experts.90.gate_proj", "model.layers.65.mlp.experts.91.gate_proj", "model.layers.65.mlp.experts.92.gate_proj", "model.layers.65.mlp.experts.93.gate_proj", "model.layers.65.mlp.experts.94.gate_proj", "model.layers.65.mlp.experts.95.gate_proj", "model.layers.65.mlp.experts.96.gate_proj", "model.layers.65.mlp.experts.97.gate_proj", "model.layers.65.mlp.experts.98.gate_proj", "model.layers.65.mlp.experts.99.gate_proj", "model.layers.65.mlp.experts.100.gate_proj", "model.layers.65.mlp.experts.101.gate_proj", "model.layers.65.mlp.experts.102.gate_proj", "model.layers.65.mlp.experts.103.gate_proj", "model.layers.65.mlp.experts.104.gate_proj", "model.layers.65.mlp.experts.105.gate_proj", "model.layers.65.mlp.experts.106.gate_proj", "model.layers.65.mlp.experts.107.gate_proj", "model.layers.65.mlp.experts.108.gate_proj", "model.layers.65.mlp.experts.109.gate_proj", "model.layers.65.mlp.experts.110.gate_proj", "model.layers.65.mlp.experts.111.gate_proj", "model.layers.65.mlp.experts.112.gate_proj", "model.layers.65.mlp.experts.113.gate_proj", "model.layers.65.mlp.experts.114.gate_proj", "model.layers.65.mlp.experts.115.gate_proj", "model.layers.65.mlp.experts.116.gate_proj", "model.layers.65.mlp.experts.117.gate_proj", "model.layers.65.mlp.experts.118.gate_proj", "model.layers.65.mlp.experts.119.gate_proj", "model.layers.65.mlp.experts.120.gate_proj", "model.layers.65.mlp.experts.121.gate_proj", "model.layers.65.mlp.experts.122.gate_proj", "model.layers.65.mlp.experts.123.gate_proj", "model.layers.65.mlp.experts.124.gate_proj", "model.layers.65.mlp.experts.125.gate_proj", "model.layers.65.mlp.experts.126.gate_proj", "model.layers.65.mlp.experts.127.gate_proj", "model.layers.65.mlp.experts.128.gate_proj", "model.layers.65.mlp.experts.129.gate_proj", "model.layers.65.mlp.experts.130.gate_proj", "model.layers.65.mlp.experts.131.gate_proj", "model.layers.65.mlp.experts.132.gate_proj", "model.layers.65.mlp.experts.133.gate_proj", "model.layers.65.mlp.experts.134.gate_proj", "model.layers.65.mlp.experts.135.gate_proj", "model.layers.65.mlp.experts.136.gate_proj", "model.layers.65.mlp.experts.137.gate_proj", "model.layers.65.mlp.experts.138.gate_proj", "model.layers.65.mlp.experts.139.gate_proj", "model.layers.65.mlp.experts.140.gate_proj", "model.layers.65.mlp.experts.141.gate_proj", "model.layers.65.mlp.experts.142.gate_proj", "model.layers.65.mlp.experts.143.gate_proj", "model.layers.65.mlp.experts.144.gate_proj", "model.layers.65.mlp.experts.145.gate_proj", "model.layers.65.mlp.experts.146.gate_proj", "model.layers.65.mlp.experts.147.gate_proj", "model.layers.65.mlp.experts.148.gate_proj", "model.layers.65.mlp.experts.149.gate_proj", "model.layers.65.mlp.experts.150.gate_proj", "model.layers.65.mlp.experts.151.gate_proj", "model.layers.65.mlp.experts.152.gate_proj", "model.layers.65.mlp.experts.153.gate_proj", "model.layers.65.mlp.experts.154.gate_proj", "model.layers.65.mlp.experts.155.gate_proj", "model.layers.65.mlp.experts.156.gate_proj", "model.layers.65.mlp.experts.157.gate_proj", "model.layers.65.mlp.experts.158.gate_proj", "model.layers.65.mlp.experts.159.gate_proj", "model.layers.65.mlp.experts.0.up_proj", "model.layers.65.mlp.experts.1.up_proj", "model.layers.65.mlp.experts.2.up_proj", "model.layers.65.mlp.experts.3.up_proj", "model.layers.65.mlp.experts.4.up_proj", "model.layers.65.mlp.experts.5.up_proj", "model.layers.65.mlp.experts.6.up_proj", "model.layers.65.mlp.experts.7.up_proj", "model.layers.65.mlp.experts.8.up_proj", "model.layers.65.mlp.experts.9.up_proj", "model.layers.65.mlp.experts.10.up_proj", "model.layers.65.mlp.experts.11.up_proj", "model.layers.65.mlp.experts.12.up_proj", "model.layers.65.mlp.experts.13.up_proj", "model.layers.65.mlp.experts.14.up_proj", "model.layers.65.mlp.experts.15.up_proj", "model.layers.65.mlp.experts.16.up_proj", "model.layers.65.mlp.experts.17.up_proj", "model.layers.65.mlp.experts.18.up_proj", "model.layers.65.mlp.experts.19.up_proj", "model.layers.65.mlp.experts.20.up_proj", "model.layers.65.mlp.experts.21.up_proj", "model.layers.65.mlp.experts.22.up_proj", "model.layers.65.mlp.experts.23.up_proj", "model.layers.65.mlp.experts.24.up_proj", "model.layers.65.mlp.experts.25.up_proj", "model.layers.65.mlp.experts.26.up_proj", "model.layers.65.mlp.experts.27.up_proj", "model.layers.65.mlp.experts.28.up_proj", "model.layers.65.mlp.experts.29.up_proj", "model.layers.65.mlp.experts.30.up_proj", "model.layers.65.mlp.experts.31.up_proj", "model.layers.65.mlp.experts.32.up_proj", "model.layers.65.mlp.experts.33.up_proj", "model.layers.65.mlp.experts.34.up_proj", "model.layers.65.mlp.experts.35.up_proj", "model.layers.65.mlp.experts.36.up_proj", "model.layers.65.mlp.experts.37.up_proj", "model.layers.65.mlp.experts.38.up_proj", "model.layers.65.mlp.experts.39.up_proj", "model.layers.65.mlp.experts.40.up_proj", "model.layers.65.mlp.experts.41.up_proj", "model.layers.65.mlp.experts.42.up_proj", "model.layers.65.mlp.experts.43.up_proj", "model.layers.65.mlp.experts.44.up_proj", "model.layers.65.mlp.experts.45.up_proj", "model.layers.65.mlp.experts.46.up_proj", "model.layers.65.mlp.experts.47.up_proj", "model.layers.65.mlp.experts.48.up_proj", "model.layers.65.mlp.experts.49.up_proj", "model.layers.65.mlp.experts.50.up_proj", "model.layers.65.mlp.experts.51.up_proj", "model.layers.65.mlp.experts.52.up_proj", "model.layers.65.mlp.experts.53.up_proj", "model.layers.65.mlp.experts.54.up_proj", "model.layers.65.mlp.experts.55.up_proj", "model.layers.65.mlp.experts.56.up_proj", "model.layers.65.mlp.experts.57.up_proj", "model.layers.65.mlp.experts.58.up_proj", "model.layers.65.mlp.experts.59.up_proj", "model.layers.65.mlp.experts.60.up_proj", "model.layers.65.mlp.experts.61.up_proj", "model.layers.65.mlp.experts.62.up_proj", "model.layers.65.mlp.experts.63.up_proj", "model.layers.65.mlp.experts.64.up_proj", "model.layers.65.mlp.experts.65.up_proj", "model.layers.65.mlp.experts.66.up_proj", "model.layers.65.mlp.experts.67.up_proj", "model.layers.65.mlp.experts.68.up_proj", "model.layers.65.mlp.experts.69.up_proj", "model.layers.65.mlp.experts.70.up_proj", "model.layers.65.mlp.experts.71.up_proj", "model.layers.65.mlp.experts.72.up_proj", "model.layers.65.mlp.experts.73.up_proj", "model.layers.65.mlp.experts.74.up_proj", "model.layers.65.mlp.experts.75.up_proj", "model.layers.65.mlp.experts.76.up_proj", "model.layers.65.mlp.experts.77.up_proj", "model.layers.65.mlp.experts.78.up_proj", "model.layers.65.mlp.experts.79.up_proj", "model.layers.65.mlp.experts.80.up_proj", "model.layers.65.mlp.experts.81.up_proj", "model.layers.65.mlp.experts.82.up_proj", "model.layers.65.mlp.experts.83.up_proj", "model.layers.65.mlp.experts.84.up_proj", "model.layers.65.mlp.experts.85.up_proj", "model.layers.65.mlp.experts.86.up_proj", "model.layers.65.mlp.experts.87.up_proj", "model.layers.65.mlp.experts.88.up_proj", "model.layers.65.mlp.experts.89.up_proj", "model.layers.65.mlp.experts.90.up_proj", "model.layers.65.mlp.experts.91.up_proj", "model.layers.65.mlp.experts.92.up_proj", "model.layers.65.mlp.experts.93.up_proj", "model.layers.65.mlp.experts.94.up_proj", "model.layers.65.mlp.experts.95.up_proj", "model.layers.65.mlp.experts.96.up_proj", "model.layers.65.mlp.experts.97.up_proj", "model.layers.65.mlp.experts.98.up_proj", "model.layers.65.mlp.experts.99.up_proj", "model.layers.65.mlp.experts.100.up_proj", "model.layers.65.mlp.experts.101.up_proj", "model.layers.65.mlp.experts.102.up_proj", "model.layers.65.mlp.experts.103.up_proj", "model.layers.65.mlp.experts.104.up_proj", "model.layers.65.mlp.experts.105.up_proj", "model.layers.65.mlp.experts.106.up_proj", "model.layers.65.mlp.experts.107.up_proj", "model.layers.65.mlp.experts.108.up_proj", "model.layers.65.mlp.experts.109.up_proj", "model.layers.65.mlp.experts.110.up_proj", "model.layers.65.mlp.experts.111.up_proj", "model.layers.65.mlp.experts.112.up_proj", "model.layers.65.mlp.experts.113.up_proj", "model.layers.65.mlp.experts.114.up_proj", "model.layers.65.mlp.experts.115.up_proj", "model.layers.65.mlp.experts.116.up_proj", "model.layers.65.mlp.experts.117.up_proj", "model.layers.65.mlp.experts.118.up_proj", "model.layers.65.mlp.experts.119.up_proj", "model.layers.65.mlp.experts.120.up_proj", "model.layers.65.mlp.experts.121.up_proj", "model.layers.65.mlp.experts.122.up_proj", "model.layers.65.mlp.experts.123.up_proj", "model.layers.65.mlp.experts.124.up_proj", "model.layers.65.mlp.experts.125.up_proj", "model.layers.65.mlp.experts.126.up_proj", "model.layers.65.mlp.experts.127.up_proj", "model.layers.65.mlp.experts.128.up_proj", "model.layers.65.mlp.experts.129.up_proj", "model.layers.65.mlp.experts.130.up_proj", "model.layers.65.mlp.experts.131.up_proj", "model.layers.65.mlp.experts.132.up_proj", "model.layers.65.mlp.experts.133.up_proj", "model.layers.65.mlp.experts.134.up_proj", "model.layers.65.mlp.experts.135.up_proj", "model.layers.65.mlp.experts.136.up_proj", "model.layers.65.mlp.experts.137.up_proj", "model.layers.65.mlp.experts.138.up_proj", "model.layers.65.mlp.experts.139.up_proj", "model.layers.65.mlp.experts.140.up_proj", "model.layers.65.mlp.experts.141.up_proj", "model.layers.65.mlp.experts.142.up_proj", "model.layers.65.mlp.experts.143.up_proj", "model.layers.65.mlp.experts.144.up_proj", "model.layers.65.mlp.experts.145.up_proj", "model.layers.65.mlp.experts.146.up_proj", "model.layers.65.mlp.experts.147.up_proj", "model.layers.65.mlp.experts.148.up_proj", "model.layers.65.mlp.experts.149.up_proj", "model.layers.65.mlp.experts.150.up_proj", "model.layers.65.mlp.experts.151.up_proj", "model.layers.65.mlp.experts.152.up_proj", "model.layers.65.mlp.experts.153.up_proj", "model.layers.65.mlp.experts.154.up_proj", "model.layers.65.mlp.experts.155.up_proj", "model.layers.65.mlp.experts.156.up_proj", "model.layers.65.mlp.experts.157.up_proj", "model.layers.65.mlp.experts.158.up_proj", "model.layers.65.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 3.7123914808038366e-06, "dbits": 2516582400 }, { "dkld": -7.450720295308633e-06, "dbits": 5033164800 } ] }, { "idx": 392, "layers": [ "model.layers.65.mlp.experts.0.down_proj", "model.layers.65.mlp.experts.1.down_proj", "model.layers.65.mlp.experts.2.down_proj", "model.layers.65.mlp.experts.3.down_proj", "model.layers.65.mlp.experts.4.down_proj", "model.layers.65.mlp.experts.5.down_proj", "model.layers.65.mlp.experts.6.down_proj", "model.layers.65.mlp.experts.7.down_proj", "model.layers.65.mlp.experts.8.down_proj", "model.layers.65.mlp.experts.9.down_proj", "model.layers.65.mlp.experts.10.down_proj", "model.layers.65.mlp.experts.11.down_proj", "model.layers.65.mlp.experts.12.down_proj", "model.layers.65.mlp.experts.13.down_proj", "model.layers.65.mlp.experts.14.down_proj", "model.layers.65.mlp.experts.15.down_proj", "model.layers.65.mlp.experts.16.down_proj", "model.layers.65.mlp.experts.17.down_proj", "model.layers.65.mlp.experts.18.down_proj", "model.layers.65.mlp.experts.19.down_proj", "model.layers.65.mlp.experts.20.down_proj", "model.layers.65.mlp.experts.21.down_proj", "model.layers.65.mlp.experts.22.down_proj", "model.layers.65.mlp.experts.23.down_proj", "model.layers.65.mlp.experts.24.down_proj", "model.layers.65.mlp.experts.25.down_proj", "model.layers.65.mlp.experts.26.down_proj", "model.layers.65.mlp.experts.27.down_proj", "model.layers.65.mlp.experts.28.down_proj", "model.layers.65.mlp.experts.29.down_proj", "model.layers.65.mlp.experts.30.down_proj", "model.layers.65.mlp.experts.31.down_proj", "model.layers.65.mlp.experts.32.down_proj", "model.layers.65.mlp.experts.33.down_proj", "model.layers.65.mlp.experts.34.down_proj", "model.layers.65.mlp.experts.35.down_proj", "model.layers.65.mlp.experts.36.down_proj", "model.layers.65.mlp.experts.37.down_proj", "model.layers.65.mlp.experts.38.down_proj", "model.layers.65.mlp.experts.39.down_proj", "model.layers.65.mlp.experts.40.down_proj", "model.layers.65.mlp.experts.41.down_proj", "model.layers.65.mlp.experts.42.down_proj", "model.layers.65.mlp.experts.43.down_proj", "model.layers.65.mlp.experts.44.down_proj", "model.layers.65.mlp.experts.45.down_proj", "model.layers.65.mlp.experts.46.down_proj", "model.layers.65.mlp.experts.47.down_proj", "model.layers.65.mlp.experts.48.down_proj", "model.layers.65.mlp.experts.49.down_proj", "model.layers.65.mlp.experts.50.down_proj", "model.layers.65.mlp.experts.51.down_proj", "model.layers.65.mlp.experts.52.down_proj", "model.layers.65.mlp.experts.53.down_proj", "model.layers.65.mlp.experts.54.down_proj", "model.layers.65.mlp.experts.55.down_proj", "model.layers.65.mlp.experts.56.down_proj", "model.layers.65.mlp.experts.57.down_proj", "model.layers.65.mlp.experts.58.down_proj", "model.layers.65.mlp.experts.59.down_proj", "model.layers.65.mlp.experts.60.down_proj", "model.layers.65.mlp.experts.61.down_proj", "model.layers.65.mlp.experts.62.down_proj", "model.layers.65.mlp.experts.63.down_proj", "model.layers.65.mlp.experts.64.down_proj", "model.layers.65.mlp.experts.65.down_proj", "model.layers.65.mlp.experts.66.down_proj", "model.layers.65.mlp.experts.67.down_proj", "model.layers.65.mlp.experts.68.down_proj", "model.layers.65.mlp.experts.69.down_proj", "model.layers.65.mlp.experts.70.down_proj", "model.layers.65.mlp.experts.71.down_proj", "model.layers.65.mlp.experts.72.down_proj", "model.layers.65.mlp.experts.73.down_proj", "model.layers.65.mlp.experts.74.down_proj", "model.layers.65.mlp.experts.75.down_proj", "model.layers.65.mlp.experts.76.down_proj", "model.layers.65.mlp.experts.77.down_proj", "model.layers.65.mlp.experts.78.down_proj", "model.layers.65.mlp.experts.79.down_proj", "model.layers.65.mlp.experts.80.down_proj", "model.layers.65.mlp.experts.81.down_proj", "model.layers.65.mlp.experts.82.down_proj", "model.layers.65.mlp.experts.83.down_proj", "model.layers.65.mlp.experts.84.down_proj", "model.layers.65.mlp.experts.85.down_proj", "model.layers.65.mlp.experts.86.down_proj", "model.layers.65.mlp.experts.87.down_proj", "model.layers.65.mlp.experts.88.down_proj", "model.layers.65.mlp.experts.89.down_proj", "model.layers.65.mlp.experts.90.down_proj", "model.layers.65.mlp.experts.91.down_proj", "model.layers.65.mlp.experts.92.down_proj", "model.layers.65.mlp.experts.93.down_proj", "model.layers.65.mlp.experts.94.down_proj", "model.layers.65.mlp.experts.95.down_proj", "model.layers.65.mlp.experts.96.down_proj", "model.layers.65.mlp.experts.97.down_proj", "model.layers.65.mlp.experts.98.down_proj", "model.layers.65.mlp.experts.99.down_proj", "model.layers.65.mlp.experts.100.down_proj", "model.layers.65.mlp.experts.101.down_proj", "model.layers.65.mlp.experts.102.down_proj", "model.layers.65.mlp.experts.103.down_proj", "model.layers.65.mlp.experts.104.down_proj", "model.layers.65.mlp.experts.105.down_proj", "model.layers.65.mlp.experts.106.down_proj", "model.layers.65.mlp.experts.107.down_proj", "model.layers.65.mlp.experts.108.down_proj", "model.layers.65.mlp.experts.109.down_proj", "model.layers.65.mlp.experts.110.down_proj", "model.layers.65.mlp.experts.111.down_proj", "model.layers.65.mlp.experts.112.down_proj", "model.layers.65.mlp.experts.113.down_proj", "model.layers.65.mlp.experts.114.down_proj", "model.layers.65.mlp.experts.115.down_proj", "model.layers.65.mlp.experts.116.down_proj", "model.layers.65.mlp.experts.117.down_proj", "model.layers.65.mlp.experts.118.down_proj", "model.layers.65.mlp.experts.119.down_proj", "model.layers.65.mlp.experts.120.down_proj", "model.layers.65.mlp.experts.121.down_proj", "model.layers.65.mlp.experts.122.down_proj", "model.layers.65.mlp.experts.123.down_proj", "model.layers.65.mlp.experts.124.down_proj", "model.layers.65.mlp.experts.125.down_proj", "model.layers.65.mlp.experts.126.down_proj", "model.layers.65.mlp.experts.127.down_proj", "model.layers.65.mlp.experts.128.down_proj", "model.layers.65.mlp.experts.129.down_proj", "model.layers.65.mlp.experts.130.down_proj", "model.layers.65.mlp.experts.131.down_proj", "model.layers.65.mlp.experts.132.down_proj", "model.layers.65.mlp.experts.133.down_proj", "model.layers.65.mlp.experts.134.down_proj", "model.layers.65.mlp.experts.135.down_proj", "model.layers.65.mlp.experts.136.down_proj", "model.layers.65.mlp.experts.137.down_proj", "model.layers.65.mlp.experts.138.down_proj", "model.layers.65.mlp.experts.139.down_proj", "model.layers.65.mlp.experts.140.down_proj", "model.layers.65.mlp.experts.141.down_proj", "model.layers.65.mlp.experts.142.down_proj", "model.layers.65.mlp.experts.143.down_proj", "model.layers.65.mlp.experts.144.down_proj", "model.layers.65.mlp.experts.145.down_proj", "model.layers.65.mlp.experts.146.down_proj", "model.layers.65.mlp.experts.147.down_proj", "model.layers.65.mlp.experts.148.down_proj", "model.layers.65.mlp.experts.149.down_proj", "model.layers.65.mlp.experts.150.down_proj", "model.layers.65.mlp.experts.151.down_proj", "model.layers.65.mlp.experts.152.down_proj", "model.layers.65.mlp.experts.153.down_proj", "model.layers.65.mlp.experts.154.down_proj", "model.layers.65.mlp.experts.155.down_proj", "model.layers.65.mlp.experts.156.down_proj", "model.layers.65.mlp.experts.157.down_proj", "model.layers.65.mlp.experts.158.down_proj", "model.layers.65.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 1.5849689953030544e-05, "dbits": 1258291200 }, { "dkld": 1.7096078954637398e-05, "dbits": 2516582400 } ] }, { "idx": 393, "layers": [ "model.layers.66.self_attn.q_proj" ], "candidates": [ { "dkld": -7.726438343524933e-05, "dbits": 62914560 }, { "dkld": -7.976454216986756e-05, "dbits": 125829120 } ] }, { "idx": 394, "layers": [ "model.layers.66.self_attn.k_proj", "model.layers.66.self_attn.v_proj" ], "candidates": [ { "dkld": -1.0521244257688175e-05, "dbits": 10485760 }, { "dkld": 9.39471647143364e-07, "dbits": 20971520 } ] }, { "idx": 395, "layers": [ "model.layers.66.self_attn.o_proj" ], "candidates": [ { "dkld": -1.0534771718084812e-05, "dbits": 62914560 }, { "dkld": 5.908287130297618e-06, "dbits": 125829120 } ] }, { "idx": 396, "layers": [ "model.layers.66.mlp.shared_experts.gate_proj", "model.layers.66.mlp.shared_experts.up_proj", "model.layers.66.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.9162446521221204e-05, "dbits": 23592960 }, { "dkld": -3.2051885500549576e-05, "dbits": 47185920 } ] }, { "idx": 397, "layers": [ "model.layers.66.mlp.experts.0.gate_proj", "model.layers.66.mlp.experts.1.gate_proj", "model.layers.66.mlp.experts.2.gate_proj", "model.layers.66.mlp.experts.3.gate_proj", "model.layers.66.mlp.experts.4.gate_proj", "model.layers.66.mlp.experts.5.gate_proj", "model.layers.66.mlp.experts.6.gate_proj", "model.layers.66.mlp.experts.7.gate_proj", "model.layers.66.mlp.experts.8.gate_proj", "model.layers.66.mlp.experts.9.gate_proj", "model.layers.66.mlp.experts.10.gate_proj", "model.layers.66.mlp.experts.11.gate_proj", "model.layers.66.mlp.experts.12.gate_proj", "model.layers.66.mlp.experts.13.gate_proj", "model.layers.66.mlp.experts.14.gate_proj", "model.layers.66.mlp.experts.15.gate_proj", "model.layers.66.mlp.experts.16.gate_proj", "model.layers.66.mlp.experts.17.gate_proj", "model.layers.66.mlp.experts.18.gate_proj", "model.layers.66.mlp.experts.19.gate_proj", "model.layers.66.mlp.experts.20.gate_proj", "model.layers.66.mlp.experts.21.gate_proj", "model.layers.66.mlp.experts.22.gate_proj", "model.layers.66.mlp.experts.23.gate_proj", "model.layers.66.mlp.experts.24.gate_proj", "model.layers.66.mlp.experts.25.gate_proj", "model.layers.66.mlp.experts.26.gate_proj", "model.layers.66.mlp.experts.27.gate_proj", "model.layers.66.mlp.experts.28.gate_proj", "model.layers.66.mlp.experts.29.gate_proj", "model.layers.66.mlp.experts.30.gate_proj", "model.layers.66.mlp.experts.31.gate_proj", "model.layers.66.mlp.experts.32.gate_proj", "model.layers.66.mlp.experts.33.gate_proj", "model.layers.66.mlp.experts.34.gate_proj", "model.layers.66.mlp.experts.35.gate_proj", "model.layers.66.mlp.experts.36.gate_proj", "model.layers.66.mlp.experts.37.gate_proj", "model.layers.66.mlp.experts.38.gate_proj", "model.layers.66.mlp.experts.39.gate_proj", "model.layers.66.mlp.experts.40.gate_proj", "model.layers.66.mlp.experts.41.gate_proj", "model.layers.66.mlp.experts.42.gate_proj", "model.layers.66.mlp.experts.43.gate_proj", "model.layers.66.mlp.experts.44.gate_proj", "model.layers.66.mlp.experts.45.gate_proj", "model.layers.66.mlp.experts.46.gate_proj", "model.layers.66.mlp.experts.47.gate_proj", "model.layers.66.mlp.experts.48.gate_proj", "model.layers.66.mlp.experts.49.gate_proj", "model.layers.66.mlp.experts.50.gate_proj", "model.layers.66.mlp.experts.51.gate_proj", "model.layers.66.mlp.experts.52.gate_proj", "model.layers.66.mlp.experts.53.gate_proj", "model.layers.66.mlp.experts.54.gate_proj", "model.layers.66.mlp.experts.55.gate_proj", "model.layers.66.mlp.experts.56.gate_proj", "model.layers.66.mlp.experts.57.gate_proj", "model.layers.66.mlp.experts.58.gate_proj", "model.layers.66.mlp.experts.59.gate_proj", "model.layers.66.mlp.experts.60.gate_proj", "model.layers.66.mlp.experts.61.gate_proj", "model.layers.66.mlp.experts.62.gate_proj", "model.layers.66.mlp.experts.63.gate_proj", "model.layers.66.mlp.experts.64.gate_proj", "model.layers.66.mlp.experts.65.gate_proj", "model.layers.66.mlp.experts.66.gate_proj", "model.layers.66.mlp.experts.67.gate_proj", "model.layers.66.mlp.experts.68.gate_proj", "model.layers.66.mlp.experts.69.gate_proj", "model.layers.66.mlp.experts.70.gate_proj", "model.layers.66.mlp.experts.71.gate_proj", "model.layers.66.mlp.experts.72.gate_proj", "model.layers.66.mlp.experts.73.gate_proj", "model.layers.66.mlp.experts.74.gate_proj", "model.layers.66.mlp.experts.75.gate_proj", "model.layers.66.mlp.experts.76.gate_proj", "model.layers.66.mlp.experts.77.gate_proj", "model.layers.66.mlp.experts.78.gate_proj", "model.layers.66.mlp.experts.79.gate_proj", "model.layers.66.mlp.experts.80.gate_proj", "model.layers.66.mlp.experts.81.gate_proj", "model.layers.66.mlp.experts.82.gate_proj", "model.layers.66.mlp.experts.83.gate_proj", "model.layers.66.mlp.experts.84.gate_proj", "model.layers.66.mlp.experts.85.gate_proj", "model.layers.66.mlp.experts.86.gate_proj", "model.layers.66.mlp.experts.87.gate_proj", "model.layers.66.mlp.experts.88.gate_proj", "model.layers.66.mlp.experts.89.gate_proj", "model.layers.66.mlp.experts.90.gate_proj", "model.layers.66.mlp.experts.91.gate_proj", "model.layers.66.mlp.experts.92.gate_proj", "model.layers.66.mlp.experts.93.gate_proj", "model.layers.66.mlp.experts.94.gate_proj", "model.layers.66.mlp.experts.95.gate_proj", "model.layers.66.mlp.experts.96.gate_proj", "model.layers.66.mlp.experts.97.gate_proj", "model.layers.66.mlp.experts.98.gate_proj", "model.layers.66.mlp.experts.99.gate_proj", "model.layers.66.mlp.experts.100.gate_proj", "model.layers.66.mlp.experts.101.gate_proj", "model.layers.66.mlp.experts.102.gate_proj", "model.layers.66.mlp.experts.103.gate_proj", "model.layers.66.mlp.experts.104.gate_proj", "model.layers.66.mlp.experts.105.gate_proj", "model.layers.66.mlp.experts.106.gate_proj", "model.layers.66.mlp.experts.107.gate_proj", "model.layers.66.mlp.experts.108.gate_proj", "model.layers.66.mlp.experts.109.gate_proj", "model.layers.66.mlp.experts.110.gate_proj", "model.layers.66.mlp.experts.111.gate_proj", "model.layers.66.mlp.experts.112.gate_proj", "model.layers.66.mlp.experts.113.gate_proj", "model.layers.66.mlp.experts.114.gate_proj", "model.layers.66.mlp.experts.115.gate_proj", "model.layers.66.mlp.experts.116.gate_proj", "model.layers.66.mlp.experts.117.gate_proj", "model.layers.66.mlp.experts.118.gate_proj", "model.layers.66.mlp.experts.119.gate_proj", "model.layers.66.mlp.experts.120.gate_proj", "model.layers.66.mlp.experts.121.gate_proj", "model.layers.66.mlp.experts.122.gate_proj", "model.layers.66.mlp.experts.123.gate_proj", "model.layers.66.mlp.experts.124.gate_proj", "model.layers.66.mlp.experts.125.gate_proj", "model.layers.66.mlp.experts.126.gate_proj", "model.layers.66.mlp.experts.127.gate_proj", "model.layers.66.mlp.experts.128.gate_proj", "model.layers.66.mlp.experts.129.gate_proj", "model.layers.66.mlp.experts.130.gate_proj", "model.layers.66.mlp.experts.131.gate_proj", "model.layers.66.mlp.experts.132.gate_proj", "model.layers.66.mlp.experts.133.gate_proj", "model.layers.66.mlp.experts.134.gate_proj", "model.layers.66.mlp.experts.135.gate_proj", "model.layers.66.mlp.experts.136.gate_proj", "model.layers.66.mlp.experts.137.gate_proj", "model.layers.66.mlp.experts.138.gate_proj", "model.layers.66.mlp.experts.139.gate_proj", "model.layers.66.mlp.experts.140.gate_proj", "model.layers.66.mlp.experts.141.gate_proj", "model.layers.66.mlp.experts.142.gate_proj", "model.layers.66.mlp.experts.143.gate_proj", "model.layers.66.mlp.experts.144.gate_proj", "model.layers.66.mlp.experts.145.gate_proj", "model.layers.66.mlp.experts.146.gate_proj", "model.layers.66.mlp.experts.147.gate_proj", "model.layers.66.mlp.experts.148.gate_proj", "model.layers.66.mlp.experts.149.gate_proj", "model.layers.66.mlp.experts.150.gate_proj", "model.layers.66.mlp.experts.151.gate_proj", "model.layers.66.mlp.experts.152.gate_proj", "model.layers.66.mlp.experts.153.gate_proj", "model.layers.66.mlp.experts.154.gate_proj", "model.layers.66.mlp.experts.155.gate_proj", "model.layers.66.mlp.experts.156.gate_proj", "model.layers.66.mlp.experts.157.gate_proj", "model.layers.66.mlp.experts.158.gate_proj", "model.layers.66.mlp.experts.159.gate_proj", "model.layers.66.mlp.experts.0.up_proj", "model.layers.66.mlp.experts.1.up_proj", "model.layers.66.mlp.experts.2.up_proj", "model.layers.66.mlp.experts.3.up_proj", "model.layers.66.mlp.experts.4.up_proj", "model.layers.66.mlp.experts.5.up_proj", "model.layers.66.mlp.experts.6.up_proj", "model.layers.66.mlp.experts.7.up_proj", "model.layers.66.mlp.experts.8.up_proj", "model.layers.66.mlp.experts.9.up_proj", "model.layers.66.mlp.experts.10.up_proj", "model.layers.66.mlp.experts.11.up_proj", "model.layers.66.mlp.experts.12.up_proj", "model.layers.66.mlp.experts.13.up_proj", "model.layers.66.mlp.experts.14.up_proj", "model.layers.66.mlp.experts.15.up_proj", "model.layers.66.mlp.experts.16.up_proj", "model.layers.66.mlp.experts.17.up_proj", "model.layers.66.mlp.experts.18.up_proj", "model.layers.66.mlp.experts.19.up_proj", "model.layers.66.mlp.experts.20.up_proj", "model.layers.66.mlp.experts.21.up_proj", "model.layers.66.mlp.experts.22.up_proj", "model.layers.66.mlp.experts.23.up_proj", "model.layers.66.mlp.experts.24.up_proj", "model.layers.66.mlp.experts.25.up_proj", "model.layers.66.mlp.experts.26.up_proj", "model.layers.66.mlp.experts.27.up_proj", "model.layers.66.mlp.experts.28.up_proj", "model.layers.66.mlp.experts.29.up_proj", "model.layers.66.mlp.experts.30.up_proj", "model.layers.66.mlp.experts.31.up_proj", "model.layers.66.mlp.experts.32.up_proj", "model.layers.66.mlp.experts.33.up_proj", "model.layers.66.mlp.experts.34.up_proj", "model.layers.66.mlp.experts.35.up_proj", "model.layers.66.mlp.experts.36.up_proj", "model.layers.66.mlp.experts.37.up_proj", "model.layers.66.mlp.experts.38.up_proj", "model.layers.66.mlp.experts.39.up_proj", "model.layers.66.mlp.experts.40.up_proj", "model.layers.66.mlp.experts.41.up_proj", "model.layers.66.mlp.experts.42.up_proj", "model.layers.66.mlp.experts.43.up_proj", "model.layers.66.mlp.experts.44.up_proj", "model.layers.66.mlp.experts.45.up_proj", "model.layers.66.mlp.experts.46.up_proj", "model.layers.66.mlp.experts.47.up_proj", "model.layers.66.mlp.experts.48.up_proj", "model.layers.66.mlp.experts.49.up_proj", "model.layers.66.mlp.experts.50.up_proj", "model.layers.66.mlp.experts.51.up_proj", "model.layers.66.mlp.experts.52.up_proj", "model.layers.66.mlp.experts.53.up_proj", "model.layers.66.mlp.experts.54.up_proj", "model.layers.66.mlp.experts.55.up_proj", "model.layers.66.mlp.experts.56.up_proj", "model.layers.66.mlp.experts.57.up_proj", "model.layers.66.mlp.experts.58.up_proj", "model.layers.66.mlp.experts.59.up_proj", "model.layers.66.mlp.experts.60.up_proj", "model.layers.66.mlp.experts.61.up_proj", "model.layers.66.mlp.experts.62.up_proj", "model.layers.66.mlp.experts.63.up_proj", "model.layers.66.mlp.experts.64.up_proj", "model.layers.66.mlp.experts.65.up_proj", "model.layers.66.mlp.experts.66.up_proj", "model.layers.66.mlp.experts.67.up_proj", "model.layers.66.mlp.experts.68.up_proj", "model.layers.66.mlp.experts.69.up_proj", "model.layers.66.mlp.experts.70.up_proj", "model.layers.66.mlp.experts.71.up_proj", "model.layers.66.mlp.experts.72.up_proj", "model.layers.66.mlp.experts.73.up_proj", "model.layers.66.mlp.experts.74.up_proj", "model.layers.66.mlp.experts.75.up_proj", "model.layers.66.mlp.experts.76.up_proj", "model.layers.66.mlp.experts.77.up_proj", "model.layers.66.mlp.experts.78.up_proj", "model.layers.66.mlp.experts.79.up_proj", "model.layers.66.mlp.experts.80.up_proj", "model.layers.66.mlp.experts.81.up_proj", "model.layers.66.mlp.experts.82.up_proj", "model.layers.66.mlp.experts.83.up_proj", "model.layers.66.mlp.experts.84.up_proj", "model.layers.66.mlp.experts.85.up_proj", "model.layers.66.mlp.experts.86.up_proj", "model.layers.66.mlp.experts.87.up_proj", "model.layers.66.mlp.experts.88.up_proj", "model.layers.66.mlp.experts.89.up_proj", "model.layers.66.mlp.experts.90.up_proj", "model.layers.66.mlp.experts.91.up_proj", "model.layers.66.mlp.experts.92.up_proj", "model.layers.66.mlp.experts.93.up_proj", "model.layers.66.mlp.experts.94.up_proj", "model.layers.66.mlp.experts.95.up_proj", "model.layers.66.mlp.experts.96.up_proj", "model.layers.66.mlp.experts.97.up_proj", "model.layers.66.mlp.experts.98.up_proj", "model.layers.66.mlp.experts.99.up_proj", "model.layers.66.mlp.experts.100.up_proj", "model.layers.66.mlp.experts.101.up_proj", "model.layers.66.mlp.experts.102.up_proj", "model.layers.66.mlp.experts.103.up_proj", "model.layers.66.mlp.experts.104.up_proj", "model.layers.66.mlp.experts.105.up_proj", "model.layers.66.mlp.experts.106.up_proj", "model.layers.66.mlp.experts.107.up_proj", "model.layers.66.mlp.experts.108.up_proj", "model.layers.66.mlp.experts.109.up_proj", "model.layers.66.mlp.experts.110.up_proj", "model.layers.66.mlp.experts.111.up_proj", "model.layers.66.mlp.experts.112.up_proj", "model.layers.66.mlp.experts.113.up_proj", "model.layers.66.mlp.experts.114.up_proj", "model.layers.66.mlp.experts.115.up_proj", "model.layers.66.mlp.experts.116.up_proj", "model.layers.66.mlp.experts.117.up_proj", "model.layers.66.mlp.experts.118.up_proj", "model.layers.66.mlp.experts.119.up_proj", "model.layers.66.mlp.experts.120.up_proj", "model.layers.66.mlp.experts.121.up_proj", "model.layers.66.mlp.experts.122.up_proj", "model.layers.66.mlp.experts.123.up_proj", "model.layers.66.mlp.experts.124.up_proj", "model.layers.66.mlp.experts.125.up_proj", "model.layers.66.mlp.experts.126.up_proj", "model.layers.66.mlp.experts.127.up_proj", "model.layers.66.mlp.experts.128.up_proj", "model.layers.66.mlp.experts.129.up_proj", "model.layers.66.mlp.experts.130.up_proj", "model.layers.66.mlp.experts.131.up_proj", "model.layers.66.mlp.experts.132.up_proj", "model.layers.66.mlp.experts.133.up_proj", "model.layers.66.mlp.experts.134.up_proj", "model.layers.66.mlp.experts.135.up_proj", "model.layers.66.mlp.experts.136.up_proj", "model.layers.66.mlp.experts.137.up_proj", "model.layers.66.mlp.experts.138.up_proj", "model.layers.66.mlp.experts.139.up_proj", "model.layers.66.mlp.experts.140.up_proj", "model.layers.66.mlp.experts.141.up_proj", "model.layers.66.mlp.experts.142.up_proj", "model.layers.66.mlp.experts.143.up_proj", "model.layers.66.mlp.experts.144.up_proj", "model.layers.66.mlp.experts.145.up_proj", "model.layers.66.mlp.experts.146.up_proj", "model.layers.66.mlp.experts.147.up_proj", "model.layers.66.mlp.experts.148.up_proj", "model.layers.66.mlp.experts.149.up_proj", "model.layers.66.mlp.experts.150.up_proj", "model.layers.66.mlp.experts.151.up_proj", "model.layers.66.mlp.experts.152.up_proj", "model.layers.66.mlp.experts.153.up_proj", "model.layers.66.mlp.experts.154.up_proj", "model.layers.66.mlp.experts.155.up_proj", "model.layers.66.mlp.experts.156.up_proj", "model.layers.66.mlp.experts.157.up_proj", "model.layers.66.mlp.experts.158.up_proj", "model.layers.66.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 3.5697361454381515e-06, "dbits": 2516582400 }, { "dkld": 5.933735519648292e-06, "dbits": 5033164800 } ] }, { "idx": 398, "layers": [ "model.layers.66.mlp.experts.0.down_proj", "model.layers.66.mlp.experts.1.down_proj", "model.layers.66.mlp.experts.2.down_proj", "model.layers.66.mlp.experts.3.down_proj", "model.layers.66.mlp.experts.4.down_proj", "model.layers.66.mlp.experts.5.down_proj", "model.layers.66.mlp.experts.6.down_proj", "model.layers.66.mlp.experts.7.down_proj", "model.layers.66.mlp.experts.8.down_proj", "model.layers.66.mlp.experts.9.down_proj", "model.layers.66.mlp.experts.10.down_proj", "model.layers.66.mlp.experts.11.down_proj", "model.layers.66.mlp.experts.12.down_proj", "model.layers.66.mlp.experts.13.down_proj", "model.layers.66.mlp.experts.14.down_proj", "model.layers.66.mlp.experts.15.down_proj", "model.layers.66.mlp.experts.16.down_proj", "model.layers.66.mlp.experts.17.down_proj", "model.layers.66.mlp.experts.18.down_proj", "model.layers.66.mlp.experts.19.down_proj", "model.layers.66.mlp.experts.20.down_proj", "model.layers.66.mlp.experts.21.down_proj", "model.layers.66.mlp.experts.22.down_proj", "model.layers.66.mlp.experts.23.down_proj", "model.layers.66.mlp.experts.24.down_proj", "model.layers.66.mlp.experts.25.down_proj", "model.layers.66.mlp.experts.26.down_proj", "model.layers.66.mlp.experts.27.down_proj", "model.layers.66.mlp.experts.28.down_proj", "model.layers.66.mlp.experts.29.down_proj", "model.layers.66.mlp.experts.30.down_proj", "model.layers.66.mlp.experts.31.down_proj", "model.layers.66.mlp.experts.32.down_proj", "model.layers.66.mlp.experts.33.down_proj", "model.layers.66.mlp.experts.34.down_proj", "model.layers.66.mlp.experts.35.down_proj", "model.layers.66.mlp.experts.36.down_proj", "model.layers.66.mlp.experts.37.down_proj", "model.layers.66.mlp.experts.38.down_proj", "model.layers.66.mlp.experts.39.down_proj", "model.layers.66.mlp.experts.40.down_proj", "model.layers.66.mlp.experts.41.down_proj", "model.layers.66.mlp.experts.42.down_proj", "model.layers.66.mlp.experts.43.down_proj", "model.layers.66.mlp.experts.44.down_proj", "model.layers.66.mlp.experts.45.down_proj", "model.layers.66.mlp.experts.46.down_proj", "model.layers.66.mlp.experts.47.down_proj", "model.layers.66.mlp.experts.48.down_proj", "model.layers.66.mlp.experts.49.down_proj", "model.layers.66.mlp.experts.50.down_proj", "model.layers.66.mlp.experts.51.down_proj", "model.layers.66.mlp.experts.52.down_proj", "model.layers.66.mlp.experts.53.down_proj", "model.layers.66.mlp.experts.54.down_proj", "model.layers.66.mlp.experts.55.down_proj", "model.layers.66.mlp.experts.56.down_proj", "model.layers.66.mlp.experts.57.down_proj", "model.layers.66.mlp.experts.58.down_proj", "model.layers.66.mlp.experts.59.down_proj", "model.layers.66.mlp.experts.60.down_proj", "model.layers.66.mlp.experts.61.down_proj", "model.layers.66.mlp.experts.62.down_proj", "model.layers.66.mlp.experts.63.down_proj", "model.layers.66.mlp.experts.64.down_proj", "model.layers.66.mlp.experts.65.down_proj", "model.layers.66.mlp.experts.66.down_proj", "model.layers.66.mlp.experts.67.down_proj", "model.layers.66.mlp.experts.68.down_proj", "model.layers.66.mlp.experts.69.down_proj", "model.layers.66.mlp.experts.70.down_proj", "model.layers.66.mlp.experts.71.down_proj", "model.layers.66.mlp.experts.72.down_proj", "model.layers.66.mlp.experts.73.down_proj", "model.layers.66.mlp.experts.74.down_proj", "model.layers.66.mlp.experts.75.down_proj", "model.layers.66.mlp.experts.76.down_proj", "model.layers.66.mlp.experts.77.down_proj", "model.layers.66.mlp.experts.78.down_proj", "model.layers.66.mlp.experts.79.down_proj", "model.layers.66.mlp.experts.80.down_proj", "model.layers.66.mlp.experts.81.down_proj", "model.layers.66.mlp.experts.82.down_proj", "model.layers.66.mlp.experts.83.down_proj", "model.layers.66.mlp.experts.84.down_proj", "model.layers.66.mlp.experts.85.down_proj", "model.layers.66.mlp.experts.86.down_proj", "model.layers.66.mlp.experts.87.down_proj", "model.layers.66.mlp.experts.88.down_proj", "model.layers.66.mlp.experts.89.down_proj", "model.layers.66.mlp.experts.90.down_proj", "model.layers.66.mlp.experts.91.down_proj", "model.layers.66.mlp.experts.92.down_proj", "model.layers.66.mlp.experts.93.down_proj", "model.layers.66.mlp.experts.94.down_proj", "model.layers.66.mlp.experts.95.down_proj", "model.layers.66.mlp.experts.96.down_proj", "model.layers.66.mlp.experts.97.down_proj", "model.layers.66.mlp.experts.98.down_proj", "model.layers.66.mlp.experts.99.down_proj", "model.layers.66.mlp.experts.100.down_proj", "model.layers.66.mlp.experts.101.down_proj", "model.layers.66.mlp.experts.102.down_proj", "model.layers.66.mlp.experts.103.down_proj", "model.layers.66.mlp.experts.104.down_proj", "model.layers.66.mlp.experts.105.down_proj", "model.layers.66.mlp.experts.106.down_proj", "model.layers.66.mlp.experts.107.down_proj", "model.layers.66.mlp.experts.108.down_proj", "model.layers.66.mlp.experts.109.down_proj", "model.layers.66.mlp.experts.110.down_proj", "model.layers.66.mlp.experts.111.down_proj", "model.layers.66.mlp.experts.112.down_proj", "model.layers.66.mlp.experts.113.down_proj", "model.layers.66.mlp.experts.114.down_proj", "model.layers.66.mlp.experts.115.down_proj", "model.layers.66.mlp.experts.116.down_proj", "model.layers.66.mlp.experts.117.down_proj", "model.layers.66.mlp.experts.118.down_proj", "model.layers.66.mlp.experts.119.down_proj", "model.layers.66.mlp.experts.120.down_proj", "model.layers.66.mlp.experts.121.down_proj", "model.layers.66.mlp.experts.122.down_proj", "model.layers.66.mlp.experts.123.down_proj", "model.layers.66.mlp.experts.124.down_proj", "model.layers.66.mlp.experts.125.down_proj", "model.layers.66.mlp.experts.126.down_proj", "model.layers.66.mlp.experts.127.down_proj", "model.layers.66.mlp.experts.128.down_proj", "model.layers.66.mlp.experts.129.down_proj", "model.layers.66.mlp.experts.130.down_proj", "model.layers.66.mlp.experts.131.down_proj", "model.layers.66.mlp.experts.132.down_proj", "model.layers.66.mlp.experts.133.down_proj", "model.layers.66.mlp.experts.134.down_proj", "model.layers.66.mlp.experts.135.down_proj", "model.layers.66.mlp.experts.136.down_proj", "model.layers.66.mlp.experts.137.down_proj", "model.layers.66.mlp.experts.138.down_proj", "model.layers.66.mlp.experts.139.down_proj", "model.layers.66.mlp.experts.140.down_proj", "model.layers.66.mlp.experts.141.down_proj", "model.layers.66.mlp.experts.142.down_proj", "model.layers.66.mlp.experts.143.down_proj", "model.layers.66.mlp.experts.144.down_proj", "model.layers.66.mlp.experts.145.down_proj", "model.layers.66.mlp.experts.146.down_proj", "model.layers.66.mlp.experts.147.down_proj", "model.layers.66.mlp.experts.148.down_proj", "model.layers.66.mlp.experts.149.down_proj", "model.layers.66.mlp.experts.150.down_proj", "model.layers.66.mlp.experts.151.down_proj", "model.layers.66.mlp.experts.152.down_proj", "model.layers.66.mlp.experts.153.down_proj", "model.layers.66.mlp.experts.154.down_proj", "model.layers.66.mlp.experts.155.down_proj", "model.layers.66.mlp.experts.156.down_proj", "model.layers.66.mlp.experts.157.down_proj", "model.layers.66.mlp.experts.158.down_proj", "model.layers.66.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -9.415647946297775e-06, "dbits": 1258291200 }, { "dkld": -7.143244147231331e-08, "dbits": 2516582400 } ] }, { "idx": 399, "layers": [ "model.layers.67.self_attn.q_proj" ], "candidates": [ { "dkld": -2.4313339963555336e-05, "dbits": 62914560 }, { "dkld": -2.8376048430799397e-05, "dbits": 125829120 } ] }, { "idx": 400, "layers": [ "model.layers.67.self_attn.k_proj", "model.layers.67.self_attn.v_proj" ], "candidates": [ { "dkld": 3.491668030619621e-05, "dbits": 10485760 }, { "dkld": 2.292306162417039e-05, "dbits": 20971520 } ] }, { "idx": 401, "layers": [ "model.layers.67.self_attn.o_proj" ], "candidates": [ { "dkld": 1.8125725910068946e-05, "dbits": 62914560 }, { "dkld": 1.8507428467274753e-05, "dbits": 125829120 } ] }, { "idx": 402, "layers": [ "model.layers.67.mlp.shared_experts.gate_proj", "model.layers.67.mlp.shared_experts.up_proj", "model.layers.67.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.949138335883513e-05, "dbits": 23592960 }, { "dkld": -1.8068403005598935e-05, "dbits": 47185920 } ] }, { "idx": 403, "layers": [ "model.layers.67.mlp.experts.0.gate_proj", "model.layers.67.mlp.experts.1.gate_proj", "model.layers.67.mlp.experts.2.gate_proj", "model.layers.67.mlp.experts.3.gate_proj", "model.layers.67.mlp.experts.4.gate_proj", "model.layers.67.mlp.experts.5.gate_proj", "model.layers.67.mlp.experts.6.gate_proj", "model.layers.67.mlp.experts.7.gate_proj", "model.layers.67.mlp.experts.8.gate_proj", "model.layers.67.mlp.experts.9.gate_proj", "model.layers.67.mlp.experts.10.gate_proj", "model.layers.67.mlp.experts.11.gate_proj", "model.layers.67.mlp.experts.12.gate_proj", "model.layers.67.mlp.experts.13.gate_proj", "model.layers.67.mlp.experts.14.gate_proj", "model.layers.67.mlp.experts.15.gate_proj", "model.layers.67.mlp.experts.16.gate_proj", "model.layers.67.mlp.experts.17.gate_proj", "model.layers.67.mlp.experts.18.gate_proj", "model.layers.67.mlp.experts.19.gate_proj", "model.layers.67.mlp.experts.20.gate_proj", "model.layers.67.mlp.experts.21.gate_proj", "model.layers.67.mlp.experts.22.gate_proj", "model.layers.67.mlp.experts.23.gate_proj", "model.layers.67.mlp.experts.24.gate_proj", "model.layers.67.mlp.experts.25.gate_proj", "model.layers.67.mlp.experts.26.gate_proj", "model.layers.67.mlp.experts.27.gate_proj", "model.layers.67.mlp.experts.28.gate_proj", "model.layers.67.mlp.experts.29.gate_proj", "model.layers.67.mlp.experts.30.gate_proj", "model.layers.67.mlp.experts.31.gate_proj", "model.layers.67.mlp.experts.32.gate_proj", "model.layers.67.mlp.experts.33.gate_proj", "model.layers.67.mlp.experts.34.gate_proj", "model.layers.67.mlp.experts.35.gate_proj", "model.layers.67.mlp.experts.36.gate_proj", "model.layers.67.mlp.experts.37.gate_proj", "model.layers.67.mlp.experts.38.gate_proj", "model.layers.67.mlp.experts.39.gate_proj", "model.layers.67.mlp.experts.40.gate_proj", "model.layers.67.mlp.experts.41.gate_proj", "model.layers.67.mlp.experts.42.gate_proj", "model.layers.67.mlp.experts.43.gate_proj", "model.layers.67.mlp.experts.44.gate_proj", "model.layers.67.mlp.experts.45.gate_proj", "model.layers.67.mlp.experts.46.gate_proj", "model.layers.67.mlp.experts.47.gate_proj", "model.layers.67.mlp.experts.48.gate_proj", "model.layers.67.mlp.experts.49.gate_proj", "model.layers.67.mlp.experts.50.gate_proj", "model.layers.67.mlp.experts.51.gate_proj", "model.layers.67.mlp.experts.52.gate_proj", "model.layers.67.mlp.experts.53.gate_proj", "model.layers.67.mlp.experts.54.gate_proj", "model.layers.67.mlp.experts.55.gate_proj", "model.layers.67.mlp.experts.56.gate_proj", "model.layers.67.mlp.experts.57.gate_proj", "model.layers.67.mlp.experts.58.gate_proj", "model.layers.67.mlp.experts.59.gate_proj", "model.layers.67.mlp.experts.60.gate_proj", "model.layers.67.mlp.experts.61.gate_proj", "model.layers.67.mlp.experts.62.gate_proj", "model.layers.67.mlp.experts.63.gate_proj", "model.layers.67.mlp.experts.64.gate_proj", "model.layers.67.mlp.experts.65.gate_proj", "model.layers.67.mlp.experts.66.gate_proj", "model.layers.67.mlp.experts.67.gate_proj", "model.layers.67.mlp.experts.68.gate_proj", "model.layers.67.mlp.experts.69.gate_proj", "model.layers.67.mlp.experts.70.gate_proj", "model.layers.67.mlp.experts.71.gate_proj", "model.layers.67.mlp.experts.72.gate_proj", "model.layers.67.mlp.experts.73.gate_proj", "model.layers.67.mlp.experts.74.gate_proj", "model.layers.67.mlp.experts.75.gate_proj", "model.layers.67.mlp.experts.76.gate_proj", "model.layers.67.mlp.experts.77.gate_proj", "model.layers.67.mlp.experts.78.gate_proj", "model.layers.67.mlp.experts.79.gate_proj", "model.layers.67.mlp.experts.80.gate_proj", "model.layers.67.mlp.experts.81.gate_proj", "model.layers.67.mlp.experts.82.gate_proj", "model.layers.67.mlp.experts.83.gate_proj", "model.layers.67.mlp.experts.84.gate_proj", "model.layers.67.mlp.experts.85.gate_proj", "model.layers.67.mlp.experts.86.gate_proj", "model.layers.67.mlp.experts.87.gate_proj", "model.layers.67.mlp.experts.88.gate_proj", "model.layers.67.mlp.experts.89.gate_proj", "model.layers.67.mlp.experts.90.gate_proj", "model.layers.67.mlp.experts.91.gate_proj", "model.layers.67.mlp.experts.92.gate_proj", "model.layers.67.mlp.experts.93.gate_proj", "model.layers.67.mlp.experts.94.gate_proj", "model.layers.67.mlp.experts.95.gate_proj", "model.layers.67.mlp.experts.96.gate_proj", "model.layers.67.mlp.experts.97.gate_proj", "model.layers.67.mlp.experts.98.gate_proj", "model.layers.67.mlp.experts.99.gate_proj", "model.layers.67.mlp.experts.100.gate_proj", "model.layers.67.mlp.experts.101.gate_proj", "model.layers.67.mlp.experts.102.gate_proj", "model.layers.67.mlp.experts.103.gate_proj", "model.layers.67.mlp.experts.104.gate_proj", "model.layers.67.mlp.experts.105.gate_proj", "model.layers.67.mlp.experts.106.gate_proj", "model.layers.67.mlp.experts.107.gate_proj", "model.layers.67.mlp.experts.108.gate_proj", "model.layers.67.mlp.experts.109.gate_proj", "model.layers.67.mlp.experts.110.gate_proj", "model.layers.67.mlp.experts.111.gate_proj", "model.layers.67.mlp.experts.112.gate_proj", "model.layers.67.mlp.experts.113.gate_proj", "model.layers.67.mlp.experts.114.gate_proj", "model.layers.67.mlp.experts.115.gate_proj", "model.layers.67.mlp.experts.116.gate_proj", "model.layers.67.mlp.experts.117.gate_proj", "model.layers.67.mlp.experts.118.gate_proj", "model.layers.67.mlp.experts.119.gate_proj", "model.layers.67.mlp.experts.120.gate_proj", "model.layers.67.mlp.experts.121.gate_proj", "model.layers.67.mlp.experts.122.gate_proj", "model.layers.67.mlp.experts.123.gate_proj", "model.layers.67.mlp.experts.124.gate_proj", "model.layers.67.mlp.experts.125.gate_proj", "model.layers.67.mlp.experts.126.gate_proj", "model.layers.67.mlp.experts.127.gate_proj", "model.layers.67.mlp.experts.128.gate_proj", "model.layers.67.mlp.experts.129.gate_proj", "model.layers.67.mlp.experts.130.gate_proj", "model.layers.67.mlp.experts.131.gate_proj", "model.layers.67.mlp.experts.132.gate_proj", "model.layers.67.mlp.experts.133.gate_proj", "model.layers.67.mlp.experts.134.gate_proj", "model.layers.67.mlp.experts.135.gate_proj", "model.layers.67.mlp.experts.136.gate_proj", "model.layers.67.mlp.experts.137.gate_proj", "model.layers.67.mlp.experts.138.gate_proj", "model.layers.67.mlp.experts.139.gate_proj", "model.layers.67.mlp.experts.140.gate_proj", "model.layers.67.mlp.experts.141.gate_proj", "model.layers.67.mlp.experts.142.gate_proj", "model.layers.67.mlp.experts.143.gate_proj", "model.layers.67.mlp.experts.144.gate_proj", "model.layers.67.mlp.experts.145.gate_proj", "model.layers.67.mlp.experts.146.gate_proj", "model.layers.67.mlp.experts.147.gate_proj", "model.layers.67.mlp.experts.148.gate_proj", "model.layers.67.mlp.experts.149.gate_proj", "model.layers.67.mlp.experts.150.gate_proj", "model.layers.67.mlp.experts.151.gate_proj", "model.layers.67.mlp.experts.152.gate_proj", "model.layers.67.mlp.experts.153.gate_proj", "model.layers.67.mlp.experts.154.gate_proj", "model.layers.67.mlp.experts.155.gate_proj", "model.layers.67.mlp.experts.156.gate_proj", "model.layers.67.mlp.experts.157.gate_proj", "model.layers.67.mlp.experts.158.gate_proj", "model.layers.67.mlp.experts.159.gate_proj", "model.layers.67.mlp.experts.0.up_proj", "model.layers.67.mlp.experts.1.up_proj", "model.layers.67.mlp.experts.2.up_proj", "model.layers.67.mlp.experts.3.up_proj", "model.layers.67.mlp.experts.4.up_proj", "model.layers.67.mlp.experts.5.up_proj", "model.layers.67.mlp.experts.6.up_proj", "model.layers.67.mlp.experts.7.up_proj", "model.layers.67.mlp.experts.8.up_proj", "model.layers.67.mlp.experts.9.up_proj", "model.layers.67.mlp.experts.10.up_proj", "model.layers.67.mlp.experts.11.up_proj", "model.layers.67.mlp.experts.12.up_proj", "model.layers.67.mlp.experts.13.up_proj", "model.layers.67.mlp.experts.14.up_proj", "model.layers.67.mlp.experts.15.up_proj", "model.layers.67.mlp.experts.16.up_proj", "model.layers.67.mlp.experts.17.up_proj", "model.layers.67.mlp.experts.18.up_proj", "model.layers.67.mlp.experts.19.up_proj", "model.layers.67.mlp.experts.20.up_proj", "model.layers.67.mlp.experts.21.up_proj", "model.layers.67.mlp.experts.22.up_proj", "model.layers.67.mlp.experts.23.up_proj", "model.layers.67.mlp.experts.24.up_proj", "model.layers.67.mlp.experts.25.up_proj", "model.layers.67.mlp.experts.26.up_proj", "model.layers.67.mlp.experts.27.up_proj", "model.layers.67.mlp.experts.28.up_proj", "model.layers.67.mlp.experts.29.up_proj", "model.layers.67.mlp.experts.30.up_proj", "model.layers.67.mlp.experts.31.up_proj", "model.layers.67.mlp.experts.32.up_proj", "model.layers.67.mlp.experts.33.up_proj", "model.layers.67.mlp.experts.34.up_proj", "model.layers.67.mlp.experts.35.up_proj", "model.layers.67.mlp.experts.36.up_proj", "model.layers.67.mlp.experts.37.up_proj", "model.layers.67.mlp.experts.38.up_proj", "model.layers.67.mlp.experts.39.up_proj", "model.layers.67.mlp.experts.40.up_proj", "model.layers.67.mlp.experts.41.up_proj", "model.layers.67.mlp.experts.42.up_proj", "model.layers.67.mlp.experts.43.up_proj", "model.layers.67.mlp.experts.44.up_proj", "model.layers.67.mlp.experts.45.up_proj", "model.layers.67.mlp.experts.46.up_proj", "model.layers.67.mlp.experts.47.up_proj", "model.layers.67.mlp.experts.48.up_proj", "model.layers.67.mlp.experts.49.up_proj", "model.layers.67.mlp.experts.50.up_proj", "model.layers.67.mlp.experts.51.up_proj", "model.layers.67.mlp.experts.52.up_proj", "model.layers.67.mlp.experts.53.up_proj", "model.layers.67.mlp.experts.54.up_proj", "model.layers.67.mlp.experts.55.up_proj", "model.layers.67.mlp.experts.56.up_proj", "model.layers.67.mlp.experts.57.up_proj", "model.layers.67.mlp.experts.58.up_proj", "model.layers.67.mlp.experts.59.up_proj", "model.layers.67.mlp.experts.60.up_proj", "model.layers.67.mlp.experts.61.up_proj", "model.layers.67.mlp.experts.62.up_proj", "model.layers.67.mlp.experts.63.up_proj", "model.layers.67.mlp.experts.64.up_proj", "model.layers.67.mlp.experts.65.up_proj", "model.layers.67.mlp.experts.66.up_proj", "model.layers.67.mlp.experts.67.up_proj", "model.layers.67.mlp.experts.68.up_proj", "model.layers.67.mlp.experts.69.up_proj", "model.layers.67.mlp.experts.70.up_proj", "model.layers.67.mlp.experts.71.up_proj", "model.layers.67.mlp.experts.72.up_proj", "model.layers.67.mlp.experts.73.up_proj", "model.layers.67.mlp.experts.74.up_proj", "model.layers.67.mlp.experts.75.up_proj", "model.layers.67.mlp.experts.76.up_proj", "model.layers.67.mlp.experts.77.up_proj", "model.layers.67.mlp.experts.78.up_proj", "model.layers.67.mlp.experts.79.up_proj", "model.layers.67.mlp.experts.80.up_proj", "model.layers.67.mlp.experts.81.up_proj", "model.layers.67.mlp.experts.82.up_proj", "model.layers.67.mlp.experts.83.up_proj", "model.layers.67.mlp.experts.84.up_proj", "model.layers.67.mlp.experts.85.up_proj", "model.layers.67.mlp.experts.86.up_proj", "model.layers.67.mlp.experts.87.up_proj", "model.layers.67.mlp.experts.88.up_proj", "model.layers.67.mlp.experts.89.up_proj", "model.layers.67.mlp.experts.90.up_proj", "model.layers.67.mlp.experts.91.up_proj", "model.layers.67.mlp.experts.92.up_proj", "model.layers.67.mlp.experts.93.up_proj", "model.layers.67.mlp.experts.94.up_proj", "model.layers.67.mlp.experts.95.up_proj", "model.layers.67.mlp.experts.96.up_proj", "model.layers.67.mlp.experts.97.up_proj", "model.layers.67.mlp.experts.98.up_proj", "model.layers.67.mlp.experts.99.up_proj", "model.layers.67.mlp.experts.100.up_proj", "model.layers.67.mlp.experts.101.up_proj", "model.layers.67.mlp.experts.102.up_proj", "model.layers.67.mlp.experts.103.up_proj", "model.layers.67.mlp.experts.104.up_proj", "model.layers.67.mlp.experts.105.up_proj", "model.layers.67.mlp.experts.106.up_proj", "model.layers.67.mlp.experts.107.up_proj", "model.layers.67.mlp.experts.108.up_proj", "model.layers.67.mlp.experts.109.up_proj", "model.layers.67.mlp.experts.110.up_proj", "model.layers.67.mlp.experts.111.up_proj", "model.layers.67.mlp.experts.112.up_proj", "model.layers.67.mlp.experts.113.up_proj", "model.layers.67.mlp.experts.114.up_proj", "model.layers.67.mlp.experts.115.up_proj", "model.layers.67.mlp.experts.116.up_proj", "model.layers.67.mlp.experts.117.up_proj", "model.layers.67.mlp.experts.118.up_proj", "model.layers.67.mlp.experts.119.up_proj", "model.layers.67.mlp.experts.120.up_proj", "model.layers.67.mlp.experts.121.up_proj", "model.layers.67.mlp.experts.122.up_proj", "model.layers.67.mlp.experts.123.up_proj", "model.layers.67.mlp.experts.124.up_proj", "model.layers.67.mlp.experts.125.up_proj", "model.layers.67.mlp.experts.126.up_proj", "model.layers.67.mlp.experts.127.up_proj", "model.layers.67.mlp.experts.128.up_proj", "model.layers.67.mlp.experts.129.up_proj", "model.layers.67.mlp.experts.130.up_proj", "model.layers.67.mlp.experts.131.up_proj", "model.layers.67.mlp.experts.132.up_proj", "model.layers.67.mlp.experts.133.up_proj", "model.layers.67.mlp.experts.134.up_proj", "model.layers.67.mlp.experts.135.up_proj", "model.layers.67.mlp.experts.136.up_proj", "model.layers.67.mlp.experts.137.up_proj", "model.layers.67.mlp.experts.138.up_proj", "model.layers.67.mlp.experts.139.up_proj", "model.layers.67.mlp.experts.140.up_proj", "model.layers.67.mlp.experts.141.up_proj", "model.layers.67.mlp.experts.142.up_proj", "model.layers.67.mlp.experts.143.up_proj", "model.layers.67.mlp.experts.144.up_proj", "model.layers.67.mlp.experts.145.up_proj", "model.layers.67.mlp.experts.146.up_proj", "model.layers.67.mlp.experts.147.up_proj", "model.layers.67.mlp.experts.148.up_proj", "model.layers.67.mlp.experts.149.up_proj", "model.layers.67.mlp.experts.150.up_proj", "model.layers.67.mlp.experts.151.up_proj", "model.layers.67.mlp.experts.152.up_proj", "model.layers.67.mlp.experts.153.up_proj", "model.layers.67.mlp.experts.154.up_proj", "model.layers.67.mlp.experts.155.up_proj", "model.layers.67.mlp.experts.156.up_proj", "model.layers.67.mlp.experts.157.up_proj", "model.layers.67.mlp.experts.158.up_proj", "model.layers.67.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -7.554260082542202e-06, "dbits": 2516582400 }, { "dkld": 1.5123630873858929e-05, "dbits": 5033164800 } ] }, { "idx": 404, "layers": [ "model.layers.67.mlp.experts.0.down_proj", "model.layers.67.mlp.experts.1.down_proj", "model.layers.67.mlp.experts.2.down_proj", "model.layers.67.mlp.experts.3.down_proj", "model.layers.67.mlp.experts.4.down_proj", "model.layers.67.mlp.experts.5.down_proj", "model.layers.67.mlp.experts.6.down_proj", "model.layers.67.mlp.experts.7.down_proj", "model.layers.67.mlp.experts.8.down_proj", "model.layers.67.mlp.experts.9.down_proj", "model.layers.67.mlp.experts.10.down_proj", "model.layers.67.mlp.experts.11.down_proj", "model.layers.67.mlp.experts.12.down_proj", "model.layers.67.mlp.experts.13.down_proj", "model.layers.67.mlp.experts.14.down_proj", "model.layers.67.mlp.experts.15.down_proj", "model.layers.67.mlp.experts.16.down_proj", "model.layers.67.mlp.experts.17.down_proj", "model.layers.67.mlp.experts.18.down_proj", "model.layers.67.mlp.experts.19.down_proj", "model.layers.67.mlp.experts.20.down_proj", "model.layers.67.mlp.experts.21.down_proj", "model.layers.67.mlp.experts.22.down_proj", "model.layers.67.mlp.experts.23.down_proj", "model.layers.67.mlp.experts.24.down_proj", "model.layers.67.mlp.experts.25.down_proj", "model.layers.67.mlp.experts.26.down_proj", "model.layers.67.mlp.experts.27.down_proj", "model.layers.67.mlp.experts.28.down_proj", "model.layers.67.mlp.experts.29.down_proj", "model.layers.67.mlp.experts.30.down_proj", "model.layers.67.mlp.experts.31.down_proj", "model.layers.67.mlp.experts.32.down_proj", "model.layers.67.mlp.experts.33.down_proj", "model.layers.67.mlp.experts.34.down_proj", "model.layers.67.mlp.experts.35.down_proj", "model.layers.67.mlp.experts.36.down_proj", "model.layers.67.mlp.experts.37.down_proj", "model.layers.67.mlp.experts.38.down_proj", "model.layers.67.mlp.experts.39.down_proj", "model.layers.67.mlp.experts.40.down_proj", "model.layers.67.mlp.experts.41.down_proj", "model.layers.67.mlp.experts.42.down_proj", "model.layers.67.mlp.experts.43.down_proj", "model.layers.67.mlp.experts.44.down_proj", "model.layers.67.mlp.experts.45.down_proj", "model.layers.67.mlp.experts.46.down_proj", "model.layers.67.mlp.experts.47.down_proj", "model.layers.67.mlp.experts.48.down_proj", "model.layers.67.mlp.experts.49.down_proj", "model.layers.67.mlp.experts.50.down_proj", "model.layers.67.mlp.experts.51.down_proj", "model.layers.67.mlp.experts.52.down_proj", "model.layers.67.mlp.experts.53.down_proj", "model.layers.67.mlp.experts.54.down_proj", "model.layers.67.mlp.experts.55.down_proj", "model.layers.67.mlp.experts.56.down_proj", "model.layers.67.mlp.experts.57.down_proj", "model.layers.67.mlp.experts.58.down_proj", "model.layers.67.mlp.experts.59.down_proj", "model.layers.67.mlp.experts.60.down_proj", "model.layers.67.mlp.experts.61.down_proj", "model.layers.67.mlp.experts.62.down_proj", "model.layers.67.mlp.experts.63.down_proj", "model.layers.67.mlp.experts.64.down_proj", "model.layers.67.mlp.experts.65.down_proj", "model.layers.67.mlp.experts.66.down_proj", "model.layers.67.mlp.experts.67.down_proj", "model.layers.67.mlp.experts.68.down_proj", "model.layers.67.mlp.experts.69.down_proj", "model.layers.67.mlp.experts.70.down_proj", "model.layers.67.mlp.experts.71.down_proj", "model.layers.67.mlp.experts.72.down_proj", "model.layers.67.mlp.experts.73.down_proj", "model.layers.67.mlp.experts.74.down_proj", "model.layers.67.mlp.experts.75.down_proj", "model.layers.67.mlp.experts.76.down_proj", "model.layers.67.mlp.experts.77.down_proj", "model.layers.67.mlp.experts.78.down_proj", "model.layers.67.mlp.experts.79.down_proj", "model.layers.67.mlp.experts.80.down_proj", "model.layers.67.mlp.experts.81.down_proj", "model.layers.67.mlp.experts.82.down_proj", "model.layers.67.mlp.experts.83.down_proj", "model.layers.67.mlp.experts.84.down_proj", "model.layers.67.mlp.experts.85.down_proj", "model.layers.67.mlp.experts.86.down_proj", "model.layers.67.mlp.experts.87.down_proj", "model.layers.67.mlp.experts.88.down_proj", "model.layers.67.mlp.experts.89.down_proj", "model.layers.67.mlp.experts.90.down_proj", "model.layers.67.mlp.experts.91.down_proj", "model.layers.67.mlp.experts.92.down_proj", "model.layers.67.mlp.experts.93.down_proj", "model.layers.67.mlp.experts.94.down_proj", "model.layers.67.mlp.experts.95.down_proj", "model.layers.67.mlp.experts.96.down_proj", "model.layers.67.mlp.experts.97.down_proj", "model.layers.67.mlp.experts.98.down_proj", "model.layers.67.mlp.experts.99.down_proj", "model.layers.67.mlp.experts.100.down_proj", "model.layers.67.mlp.experts.101.down_proj", "model.layers.67.mlp.experts.102.down_proj", "model.layers.67.mlp.experts.103.down_proj", "model.layers.67.mlp.experts.104.down_proj", "model.layers.67.mlp.experts.105.down_proj", "model.layers.67.mlp.experts.106.down_proj", "model.layers.67.mlp.experts.107.down_proj", "model.layers.67.mlp.experts.108.down_proj", "model.layers.67.mlp.experts.109.down_proj", "model.layers.67.mlp.experts.110.down_proj", "model.layers.67.mlp.experts.111.down_proj", "model.layers.67.mlp.experts.112.down_proj", "model.layers.67.mlp.experts.113.down_proj", "model.layers.67.mlp.experts.114.down_proj", "model.layers.67.mlp.experts.115.down_proj", "model.layers.67.mlp.experts.116.down_proj", "model.layers.67.mlp.experts.117.down_proj", "model.layers.67.mlp.experts.118.down_proj", "model.layers.67.mlp.experts.119.down_proj", "model.layers.67.mlp.experts.120.down_proj", "model.layers.67.mlp.experts.121.down_proj", "model.layers.67.mlp.experts.122.down_proj", "model.layers.67.mlp.experts.123.down_proj", "model.layers.67.mlp.experts.124.down_proj", "model.layers.67.mlp.experts.125.down_proj", "model.layers.67.mlp.experts.126.down_proj", "model.layers.67.mlp.experts.127.down_proj", "model.layers.67.mlp.experts.128.down_proj", "model.layers.67.mlp.experts.129.down_proj", "model.layers.67.mlp.experts.130.down_proj", "model.layers.67.mlp.experts.131.down_proj", "model.layers.67.mlp.experts.132.down_proj", "model.layers.67.mlp.experts.133.down_proj", "model.layers.67.mlp.experts.134.down_proj", "model.layers.67.mlp.experts.135.down_proj", "model.layers.67.mlp.experts.136.down_proj", "model.layers.67.mlp.experts.137.down_proj", "model.layers.67.mlp.experts.138.down_proj", "model.layers.67.mlp.experts.139.down_proj", "model.layers.67.mlp.experts.140.down_proj", "model.layers.67.mlp.experts.141.down_proj", "model.layers.67.mlp.experts.142.down_proj", "model.layers.67.mlp.experts.143.down_proj", "model.layers.67.mlp.experts.144.down_proj", "model.layers.67.mlp.experts.145.down_proj", "model.layers.67.mlp.experts.146.down_proj", "model.layers.67.mlp.experts.147.down_proj", "model.layers.67.mlp.experts.148.down_proj", "model.layers.67.mlp.experts.149.down_proj", "model.layers.67.mlp.experts.150.down_proj", "model.layers.67.mlp.experts.151.down_proj", "model.layers.67.mlp.experts.152.down_proj", "model.layers.67.mlp.experts.153.down_proj", "model.layers.67.mlp.experts.154.down_proj", "model.layers.67.mlp.experts.155.down_proj", "model.layers.67.mlp.experts.156.down_proj", "model.layers.67.mlp.experts.157.down_proj", "model.layers.67.mlp.experts.158.down_proj", "model.layers.67.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 2.8103590011610557e-06, "dbits": 1258291200 }, { "dkld": 3.744917921722976e-06, "dbits": 2516582400 } ] }, { "idx": 405, "layers": [ "model.layers.68.self_attn.q_proj" ], "candidates": [ { "dkld": -1.6283709555857395e-06, "dbits": 62914560 }, { "dkld": -1.2610759586095116e-05, "dbits": 125829120 } ] }, { "idx": 406, "layers": [ "model.layers.68.self_attn.k_proj", "model.layers.68.self_attn.v_proj" ], "candidates": [ { "dkld": 7.154920604079962e-05, "dbits": 10485760 }, { "dkld": 2.9708677902818767e-05, "dbits": 20971520 } ] }, { "idx": 407, "layers": [ "model.layers.68.self_attn.o_proj" ], "candidates": [ { "dkld": -2.59914668276906e-05, "dbits": 62914560 }, { "dkld": -4.788036458194117e-05, "dbits": 125829120 } ] }, { "idx": 408, "layers": [ "model.layers.68.mlp.shared_experts.gate_proj", "model.layers.68.mlp.shared_experts.up_proj", "model.layers.68.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -8.570728823542595e-06, "dbits": 23592960 }, { "dkld": -1.718241255730356e-05, "dbits": 47185920 } ] }, { "idx": 409, "layers": [ "model.layers.68.mlp.experts.0.gate_proj", "model.layers.68.mlp.experts.1.gate_proj", "model.layers.68.mlp.experts.2.gate_proj", "model.layers.68.mlp.experts.3.gate_proj", "model.layers.68.mlp.experts.4.gate_proj", "model.layers.68.mlp.experts.5.gate_proj", "model.layers.68.mlp.experts.6.gate_proj", "model.layers.68.mlp.experts.7.gate_proj", "model.layers.68.mlp.experts.8.gate_proj", "model.layers.68.mlp.experts.9.gate_proj", "model.layers.68.mlp.experts.10.gate_proj", "model.layers.68.mlp.experts.11.gate_proj", "model.layers.68.mlp.experts.12.gate_proj", "model.layers.68.mlp.experts.13.gate_proj", "model.layers.68.mlp.experts.14.gate_proj", "model.layers.68.mlp.experts.15.gate_proj", "model.layers.68.mlp.experts.16.gate_proj", "model.layers.68.mlp.experts.17.gate_proj", "model.layers.68.mlp.experts.18.gate_proj", "model.layers.68.mlp.experts.19.gate_proj", "model.layers.68.mlp.experts.20.gate_proj", "model.layers.68.mlp.experts.21.gate_proj", "model.layers.68.mlp.experts.22.gate_proj", "model.layers.68.mlp.experts.23.gate_proj", "model.layers.68.mlp.experts.24.gate_proj", "model.layers.68.mlp.experts.25.gate_proj", "model.layers.68.mlp.experts.26.gate_proj", "model.layers.68.mlp.experts.27.gate_proj", "model.layers.68.mlp.experts.28.gate_proj", "model.layers.68.mlp.experts.29.gate_proj", "model.layers.68.mlp.experts.30.gate_proj", "model.layers.68.mlp.experts.31.gate_proj", "model.layers.68.mlp.experts.32.gate_proj", "model.layers.68.mlp.experts.33.gate_proj", "model.layers.68.mlp.experts.34.gate_proj", "model.layers.68.mlp.experts.35.gate_proj", "model.layers.68.mlp.experts.36.gate_proj", "model.layers.68.mlp.experts.37.gate_proj", "model.layers.68.mlp.experts.38.gate_proj", "model.layers.68.mlp.experts.39.gate_proj", "model.layers.68.mlp.experts.40.gate_proj", "model.layers.68.mlp.experts.41.gate_proj", "model.layers.68.mlp.experts.42.gate_proj", "model.layers.68.mlp.experts.43.gate_proj", "model.layers.68.mlp.experts.44.gate_proj", "model.layers.68.mlp.experts.45.gate_proj", "model.layers.68.mlp.experts.46.gate_proj", "model.layers.68.mlp.experts.47.gate_proj", "model.layers.68.mlp.experts.48.gate_proj", "model.layers.68.mlp.experts.49.gate_proj", "model.layers.68.mlp.experts.50.gate_proj", "model.layers.68.mlp.experts.51.gate_proj", "model.layers.68.mlp.experts.52.gate_proj", "model.layers.68.mlp.experts.53.gate_proj", "model.layers.68.mlp.experts.54.gate_proj", "model.layers.68.mlp.experts.55.gate_proj", "model.layers.68.mlp.experts.56.gate_proj", "model.layers.68.mlp.experts.57.gate_proj", "model.layers.68.mlp.experts.58.gate_proj", "model.layers.68.mlp.experts.59.gate_proj", "model.layers.68.mlp.experts.60.gate_proj", "model.layers.68.mlp.experts.61.gate_proj", "model.layers.68.mlp.experts.62.gate_proj", "model.layers.68.mlp.experts.63.gate_proj", "model.layers.68.mlp.experts.64.gate_proj", "model.layers.68.mlp.experts.65.gate_proj", "model.layers.68.mlp.experts.66.gate_proj", "model.layers.68.mlp.experts.67.gate_proj", "model.layers.68.mlp.experts.68.gate_proj", "model.layers.68.mlp.experts.69.gate_proj", "model.layers.68.mlp.experts.70.gate_proj", "model.layers.68.mlp.experts.71.gate_proj", "model.layers.68.mlp.experts.72.gate_proj", "model.layers.68.mlp.experts.73.gate_proj", "model.layers.68.mlp.experts.74.gate_proj", "model.layers.68.mlp.experts.75.gate_proj", "model.layers.68.mlp.experts.76.gate_proj", "model.layers.68.mlp.experts.77.gate_proj", "model.layers.68.mlp.experts.78.gate_proj", "model.layers.68.mlp.experts.79.gate_proj", "model.layers.68.mlp.experts.80.gate_proj", "model.layers.68.mlp.experts.81.gate_proj", "model.layers.68.mlp.experts.82.gate_proj", "model.layers.68.mlp.experts.83.gate_proj", "model.layers.68.mlp.experts.84.gate_proj", "model.layers.68.mlp.experts.85.gate_proj", "model.layers.68.mlp.experts.86.gate_proj", "model.layers.68.mlp.experts.87.gate_proj", "model.layers.68.mlp.experts.88.gate_proj", "model.layers.68.mlp.experts.89.gate_proj", "model.layers.68.mlp.experts.90.gate_proj", "model.layers.68.mlp.experts.91.gate_proj", "model.layers.68.mlp.experts.92.gate_proj", "model.layers.68.mlp.experts.93.gate_proj", "model.layers.68.mlp.experts.94.gate_proj", "model.layers.68.mlp.experts.95.gate_proj", "model.layers.68.mlp.experts.96.gate_proj", "model.layers.68.mlp.experts.97.gate_proj", "model.layers.68.mlp.experts.98.gate_proj", "model.layers.68.mlp.experts.99.gate_proj", "model.layers.68.mlp.experts.100.gate_proj", "model.layers.68.mlp.experts.101.gate_proj", "model.layers.68.mlp.experts.102.gate_proj", "model.layers.68.mlp.experts.103.gate_proj", "model.layers.68.mlp.experts.104.gate_proj", "model.layers.68.mlp.experts.105.gate_proj", "model.layers.68.mlp.experts.106.gate_proj", "model.layers.68.mlp.experts.107.gate_proj", "model.layers.68.mlp.experts.108.gate_proj", "model.layers.68.mlp.experts.109.gate_proj", "model.layers.68.mlp.experts.110.gate_proj", "model.layers.68.mlp.experts.111.gate_proj", "model.layers.68.mlp.experts.112.gate_proj", "model.layers.68.mlp.experts.113.gate_proj", "model.layers.68.mlp.experts.114.gate_proj", "model.layers.68.mlp.experts.115.gate_proj", "model.layers.68.mlp.experts.116.gate_proj", "model.layers.68.mlp.experts.117.gate_proj", "model.layers.68.mlp.experts.118.gate_proj", "model.layers.68.mlp.experts.119.gate_proj", "model.layers.68.mlp.experts.120.gate_proj", "model.layers.68.mlp.experts.121.gate_proj", "model.layers.68.mlp.experts.122.gate_proj", "model.layers.68.mlp.experts.123.gate_proj", "model.layers.68.mlp.experts.124.gate_proj", "model.layers.68.mlp.experts.125.gate_proj", "model.layers.68.mlp.experts.126.gate_proj", "model.layers.68.mlp.experts.127.gate_proj", "model.layers.68.mlp.experts.128.gate_proj", "model.layers.68.mlp.experts.129.gate_proj", "model.layers.68.mlp.experts.130.gate_proj", "model.layers.68.mlp.experts.131.gate_proj", "model.layers.68.mlp.experts.132.gate_proj", "model.layers.68.mlp.experts.133.gate_proj", "model.layers.68.mlp.experts.134.gate_proj", "model.layers.68.mlp.experts.135.gate_proj", "model.layers.68.mlp.experts.136.gate_proj", "model.layers.68.mlp.experts.137.gate_proj", "model.layers.68.mlp.experts.138.gate_proj", "model.layers.68.mlp.experts.139.gate_proj", "model.layers.68.mlp.experts.140.gate_proj", "model.layers.68.mlp.experts.141.gate_proj", "model.layers.68.mlp.experts.142.gate_proj", "model.layers.68.mlp.experts.143.gate_proj", "model.layers.68.mlp.experts.144.gate_proj", "model.layers.68.mlp.experts.145.gate_proj", "model.layers.68.mlp.experts.146.gate_proj", "model.layers.68.mlp.experts.147.gate_proj", "model.layers.68.mlp.experts.148.gate_proj", "model.layers.68.mlp.experts.149.gate_proj", "model.layers.68.mlp.experts.150.gate_proj", "model.layers.68.mlp.experts.151.gate_proj", "model.layers.68.mlp.experts.152.gate_proj", "model.layers.68.mlp.experts.153.gate_proj", "model.layers.68.mlp.experts.154.gate_proj", "model.layers.68.mlp.experts.155.gate_proj", "model.layers.68.mlp.experts.156.gate_proj", "model.layers.68.mlp.experts.157.gate_proj", "model.layers.68.mlp.experts.158.gate_proj", "model.layers.68.mlp.experts.159.gate_proj", "model.layers.68.mlp.experts.0.up_proj", "model.layers.68.mlp.experts.1.up_proj", "model.layers.68.mlp.experts.2.up_proj", "model.layers.68.mlp.experts.3.up_proj", "model.layers.68.mlp.experts.4.up_proj", "model.layers.68.mlp.experts.5.up_proj", "model.layers.68.mlp.experts.6.up_proj", "model.layers.68.mlp.experts.7.up_proj", "model.layers.68.mlp.experts.8.up_proj", "model.layers.68.mlp.experts.9.up_proj", "model.layers.68.mlp.experts.10.up_proj", "model.layers.68.mlp.experts.11.up_proj", "model.layers.68.mlp.experts.12.up_proj", "model.layers.68.mlp.experts.13.up_proj", "model.layers.68.mlp.experts.14.up_proj", "model.layers.68.mlp.experts.15.up_proj", "model.layers.68.mlp.experts.16.up_proj", "model.layers.68.mlp.experts.17.up_proj", "model.layers.68.mlp.experts.18.up_proj", "model.layers.68.mlp.experts.19.up_proj", "model.layers.68.mlp.experts.20.up_proj", "model.layers.68.mlp.experts.21.up_proj", "model.layers.68.mlp.experts.22.up_proj", "model.layers.68.mlp.experts.23.up_proj", "model.layers.68.mlp.experts.24.up_proj", "model.layers.68.mlp.experts.25.up_proj", "model.layers.68.mlp.experts.26.up_proj", "model.layers.68.mlp.experts.27.up_proj", "model.layers.68.mlp.experts.28.up_proj", "model.layers.68.mlp.experts.29.up_proj", "model.layers.68.mlp.experts.30.up_proj", "model.layers.68.mlp.experts.31.up_proj", "model.layers.68.mlp.experts.32.up_proj", "model.layers.68.mlp.experts.33.up_proj", "model.layers.68.mlp.experts.34.up_proj", "model.layers.68.mlp.experts.35.up_proj", "model.layers.68.mlp.experts.36.up_proj", "model.layers.68.mlp.experts.37.up_proj", "model.layers.68.mlp.experts.38.up_proj", "model.layers.68.mlp.experts.39.up_proj", "model.layers.68.mlp.experts.40.up_proj", "model.layers.68.mlp.experts.41.up_proj", "model.layers.68.mlp.experts.42.up_proj", "model.layers.68.mlp.experts.43.up_proj", "model.layers.68.mlp.experts.44.up_proj", "model.layers.68.mlp.experts.45.up_proj", "model.layers.68.mlp.experts.46.up_proj", "model.layers.68.mlp.experts.47.up_proj", "model.layers.68.mlp.experts.48.up_proj", "model.layers.68.mlp.experts.49.up_proj", "model.layers.68.mlp.experts.50.up_proj", "model.layers.68.mlp.experts.51.up_proj", "model.layers.68.mlp.experts.52.up_proj", "model.layers.68.mlp.experts.53.up_proj", "model.layers.68.mlp.experts.54.up_proj", "model.layers.68.mlp.experts.55.up_proj", "model.layers.68.mlp.experts.56.up_proj", "model.layers.68.mlp.experts.57.up_proj", "model.layers.68.mlp.experts.58.up_proj", "model.layers.68.mlp.experts.59.up_proj", "model.layers.68.mlp.experts.60.up_proj", "model.layers.68.mlp.experts.61.up_proj", "model.layers.68.mlp.experts.62.up_proj", "model.layers.68.mlp.experts.63.up_proj", "model.layers.68.mlp.experts.64.up_proj", "model.layers.68.mlp.experts.65.up_proj", "model.layers.68.mlp.experts.66.up_proj", "model.layers.68.mlp.experts.67.up_proj", "model.layers.68.mlp.experts.68.up_proj", "model.layers.68.mlp.experts.69.up_proj", "model.layers.68.mlp.experts.70.up_proj", "model.layers.68.mlp.experts.71.up_proj", "model.layers.68.mlp.experts.72.up_proj", "model.layers.68.mlp.experts.73.up_proj", "model.layers.68.mlp.experts.74.up_proj", "model.layers.68.mlp.experts.75.up_proj", "model.layers.68.mlp.experts.76.up_proj", "model.layers.68.mlp.experts.77.up_proj", "model.layers.68.mlp.experts.78.up_proj", "model.layers.68.mlp.experts.79.up_proj", "model.layers.68.mlp.experts.80.up_proj", "model.layers.68.mlp.experts.81.up_proj", "model.layers.68.mlp.experts.82.up_proj", "model.layers.68.mlp.experts.83.up_proj", "model.layers.68.mlp.experts.84.up_proj", "model.layers.68.mlp.experts.85.up_proj", "model.layers.68.mlp.experts.86.up_proj", "model.layers.68.mlp.experts.87.up_proj", "model.layers.68.mlp.experts.88.up_proj", "model.layers.68.mlp.experts.89.up_proj", "model.layers.68.mlp.experts.90.up_proj", "model.layers.68.mlp.experts.91.up_proj", "model.layers.68.mlp.experts.92.up_proj", "model.layers.68.mlp.experts.93.up_proj", "model.layers.68.mlp.experts.94.up_proj", "model.layers.68.mlp.experts.95.up_proj", "model.layers.68.mlp.experts.96.up_proj", "model.layers.68.mlp.experts.97.up_proj", "model.layers.68.mlp.experts.98.up_proj", "model.layers.68.mlp.experts.99.up_proj", "model.layers.68.mlp.experts.100.up_proj", "model.layers.68.mlp.experts.101.up_proj", "model.layers.68.mlp.experts.102.up_proj", "model.layers.68.mlp.experts.103.up_proj", "model.layers.68.mlp.experts.104.up_proj", "model.layers.68.mlp.experts.105.up_proj", "model.layers.68.mlp.experts.106.up_proj", "model.layers.68.mlp.experts.107.up_proj", "model.layers.68.mlp.experts.108.up_proj", "model.layers.68.mlp.experts.109.up_proj", "model.layers.68.mlp.experts.110.up_proj", "model.layers.68.mlp.experts.111.up_proj", "model.layers.68.mlp.experts.112.up_proj", "model.layers.68.mlp.experts.113.up_proj", "model.layers.68.mlp.experts.114.up_proj", "model.layers.68.mlp.experts.115.up_proj", "model.layers.68.mlp.experts.116.up_proj", "model.layers.68.mlp.experts.117.up_proj", "model.layers.68.mlp.experts.118.up_proj", "model.layers.68.mlp.experts.119.up_proj", "model.layers.68.mlp.experts.120.up_proj", "model.layers.68.mlp.experts.121.up_proj", "model.layers.68.mlp.experts.122.up_proj", "model.layers.68.mlp.experts.123.up_proj", "model.layers.68.mlp.experts.124.up_proj", "model.layers.68.mlp.experts.125.up_proj", "model.layers.68.mlp.experts.126.up_proj", "model.layers.68.mlp.experts.127.up_proj", "model.layers.68.mlp.experts.128.up_proj", "model.layers.68.mlp.experts.129.up_proj", "model.layers.68.mlp.experts.130.up_proj", "model.layers.68.mlp.experts.131.up_proj", "model.layers.68.mlp.experts.132.up_proj", "model.layers.68.mlp.experts.133.up_proj", "model.layers.68.mlp.experts.134.up_proj", "model.layers.68.mlp.experts.135.up_proj", "model.layers.68.mlp.experts.136.up_proj", "model.layers.68.mlp.experts.137.up_proj", "model.layers.68.mlp.experts.138.up_proj", "model.layers.68.mlp.experts.139.up_proj", "model.layers.68.mlp.experts.140.up_proj", "model.layers.68.mlp.experts.141.up_proj", "model.layers.68.mlp.experts.142.up_proj", "model.layers.68.mlp.experts.143.up_proj", "model.layers.68.mlp.experts.144.up_proj", "model.layers.68.mlp.experts.145.up_proj", "model.layers.68.mlp.experts.146.up_proj", "model.layers.68.mlp.experts.147.up_proj", "model.layers.68.mlp.experts.148.up_proj", "model.layers.68.mlp.experts.149.up_proj", "model.layers.68.mlp.experts.150.up_proj", "model.layers.68.mlp.experts.151.up_proj", "model.layers.68.mlp.experts.152.up_proj", "model.layers.68.mlp.experts.153.up_proj", "model.layers.68.mlp.experts.154.up_proj", "model.layers.68.mlp.experts.155.up_proj", "model.layers.68.mlp.experts.156.up_proj", "model.layers.68.mlp.experts.157.up_proj", "model.layers.68.mlp.experts.158.up_proj", "model.layers.68.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 2.056094817817246e-05, "dbits": 2516582400 }, { "dkld": 1.7145858146251636e-05, "dbits": 5033164800 } ] }, { "idx": 410, "layers": [ "model.layers.68.mlp.experts.0.down_proj", "model.layers.68.mlp.experts.1.down_proj", "model.layers.68.mlp.experts.2.down_proj", "model.layers.68.mlp.experts.3.down_proj", "model.layers.68.mlp.experts.4.down_proj", "model.layers.68.mlp.experts.5.down_proj", "model.layers.68.mlp.experts.6.down_proj", "model.layers.68.mlp.experts.7.down_proj", "model.layers.68.mlp.experts.8.down_proj", "model.layers.68.mlp.experts.9.down_proj", "model.layers.68.mlp.experts.10.down_proj", "model.layers.68.mlp.experts.11.down_proj", "model.layers.68.mlp.experts.12.down_proj", "model.layers.68.mlp.experts.13.down_proj", "model.layers.68.mlp.experts.14.down_proj", "model.layers.68.mlp.experts.15.down_proj", "model.layers.68.mlp.experts.16.down_proj", "model.layers.68.mlp.experts.17.down_proj", "model.layers.68.mlp.experts.18.down_proj", "model.layers.68.mlp.experts.19.down_proj", "model.layers.68.mlp.experts.20.down_proj", "model.layers.68.mlp.experts.21.down_proj", "model.layers.68.mlp.experts.22.down_proj", "model.layers.68.mlp.experts.23.down_proj", "model.layers.68.mlp.experts.24.down_proj", "model.layers.68.mlp.experts.25.down_proj", "model.layers.68.mlp.experts.26.down_proj", "model.layers.68.mlp.experts.27.down_proj", "model.layers.68.mlp.experts.28.down_proj", "model.layers.68.mlp.experts.29.down_proj", "model.layers.68.mlp.experts.30.down_proj", "model.layers.68.mlp.experts.31.down_proj", "model.layers.68.mlp.experts.32.down_proj", "model.layers.68.mlp.experts.33.down_proj", "model.layers.68.mlp.experts.34.down_proj", "model.layers.68.mlp.experts.35.down_proj", "model.layers.68.mlp.experts.36.down_proj", "model.layers.68.mlp.experts.37.down_proj", "model.layers.68.mlp.experts.38.down_proj", "model.layers.68.mlp.experts.39.down_proj", "model.layers.68.mlp.experts.40.down_proj", "model.layers.68.mlp.experts.41.down_proj", "model.layers.68.mlp.experts.42.down_proj", "model.layers.68.mlp.experts.43.down_proj", "model.layers.68.mlp.experts.44.down_proj", "model.layers.68.mlp.experts.45.down_proj", "model.layers.68.mlp.experts.46.down_proj", "model.layers.68.mlp.experts.47.down_proj", "model.layers.68.mlp.experts.48.down_proj", "model.layers.68.mlp.experts.49.down_proj", "model.layers.68.mlp.experts.50.down_proj", "model.layers.68.mlp.experts.51.down_proj", "model.layers.68.mlp.experts.52.down_proj", "model.layers.68.mlp.experts.53.down_proj", "model.layers.68.mlp.experts.54.down_proj", "model.layers.68.mlp.experts.55.down_proj", "model.layers.68.mlp.experts.56.down_proj", "model.layers.68.mlp.experts.57.down_proj", "model.layers.68.mlp.experts.58.down_proj", "model.layers.68.mlp.experts.59.down_proj", "model.layers.68.mlp.experts.60.down_proj", "model.layers.68.mlp.experts.61.down_proj", "model.layers.68.mlp.experts.62.down_proj", "model.layers.68.mlp.experts.63.down_proj", "model.layers.68.mlp.experts.64.down_proj", "model.layers.68.mlp.experts.65.down_proj", "model.layers.68.mlp.experts.66.down_proj", "model.layers.68.mlp.experts.67.down_proj", "model.layers.68.mlp.experts.68.down_proj", "model.layers.68.mlp.experts.69.down_proj", "model.layers.68.mlp.experts.70.down_proj", "model.layers.68.mlp.experts.71.down_proj", "model.layers.68.mlp.experts.72.down_proj", "model.layers.68.mlp.experts.73.down_proj", "model.layers.68.mlp.experts.74.down_proj", "model.layers.68.mlp.experts.75.down_proj", "model.layers.68.mlp.experts.76.down_proj", "model.layers.68.mlp.experts.77.down_proj", "model.layers.68.mlp.experts.78.down_proj", "model.layers.68.mlp.experts.79.down_proj", "model.layers.68.mlp.experts.80.down_proj", "model.layers.68.mlp.experts.81.down_proj", "model.layers.68.mlp.experts.82.down_proj", "model.layers.68.mlp.experts.83.down_proj", "model.layers.68.mlp.experts.84.down_proj", "model.layers.68.mlp.experts.85.down_proj", "model.layers.68.mlp.experts.86.down_proj", "model.layers.68.mlp.experts.87.down_proj", "model.layers.68.mlp.experts.88.down_proj", "model.layers.68.mlp.experts.89.down_proj", "model.layers.68.mlp.experts.90.down_proj", "model.layers.68.mlp.experts.91.down_proj", "model.layers.68.mlp.experts.92.down_proj", "model.layers.68.mlp.experts.93.down_proj", "model.layers.68.mlp.experts.94.down_proj", "model.layers.68.mlp.experts.95.down_proj", "model.layers.68.mlp.experts.96.down_proj", "model.layers.68.mlp.experts.97.down_proj", "model.layers.68.mlp.experts.98.down_proj", "model.layers.68.mlp.experts.99.down_proj", "model.layers.68.mlp.experts.100.down_proj", "model.layers.68.mlp.experts.101.down_proj", "model.layers.68.mlp.experts.102.down_proj", "model.layers.68.mlp.experts.103.down_proj", "model.layers.68.mlp.experts.104.down_proj", "model.layers.68.mlp.experts.105.down_proj", "model.layers.68.mlp.experts.106.down_proj", "model.layers.68.mlp.experts.107.down_proj", "model.layers.68.mlp.experts.108.down_proj", "model.layers.68.mlp.experts.109.down_proj", "model.layers.68.mlp.experts.110.down_proj", "model.layers.68.mlp.experts.111.down_proj", "model.layers.68.mlp.experts.112.down_proj", "model.layers.68.mlp.experts.113.down_proj", "model.layers.68.mlp.experts.114.down_proj", "model.layers.68.mlp.experts.115.down_proj", "model.layers.68.mlp.experts.116.down_proj", "model.layers.68.mlp.experts.117.down_proj", "model.layers.68.mlp.experts.118.down_proj", "model.layers.68.mlp.experts.119.down_proj", "model.layers.68.mlp.experts.120.down_proj", "model.layers.68.mlp.experts.121.down_proj", "model.layers.68.mlp.experts.122.down_proj", "model.layers.68.mlp.experts.123.down_proj", "model.layers.68.mlp.experts.124.down_proj", "model.layers.68.mlp.experts.125.down_proj", "model.layers.68.mlp.experts.126.down_proj", "model.layers.68.mlp.experts.127.down_proj", "model.layers.68.mlp.experts.128.down_proj", "model.layers.68.mlp.experts.129.down_proj", "model.layers.68.mlp.experts.130.down_proj", "model.layers.68.mlp.experts.131.down_proj", "model.layers.68.mlp.experts.132.down_proj", "model.layers.68.mlp.experts.133.down_proj", "model.layers.68.mlp.experts.134.down_proj", "model.layers.68.mlp.experts.135.down_proj", "model.layers.68.mlp.experts.136.down_proj", "model.layers.68.mlp.experts.137.down_proj", "model.layers.68.mlp.experts.138.down_proj", "model.layers.68.mlp.experts.139.down_proj", "model.layers.68.mlp.experts.140.down_proj", "model.layers.68.mlp.experts.141.down_proj", "model.layers.68.mlp.experts.142.down_proj", "model.layers.68.mlp.experts.143.down_proj", "model.layers.68.mlp.experts.144.down_proj", "model.layers.68.mlp.experts.145.down_proj", "model.layers.68.mlp.experts.146.down_proj", "model.layers.68.mlp.experts.147.down_proj", "model.layers.68.mlp.experts.148.down_proj", "model.layers.68.mlp.experts.149.down_proj", "model.layers.68.mlp.experts.150.down_proj", "model.layers.68.mlp.experts.151.down_proj", "model.layers.68.mlp.experts.152.down_proj", "model.layers.68.mlp.experts.153.down_proj", "model.layers.68.mlp.experts.154.down_proj", "model.layers.68.mlp.experts.155.down_proj", "model.layers.68.mlp.experts.156.down_proj", "model.layers.68.mlp.experts.157.down_proj", "model.layers.68.mlp.experts.158.down_proj", "model.layers.68.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.1426472812891006e-05, "dbits": 1258291200 }, { "dkld": -2.4042092263698578e-05, "dbits": 2516582400 } ] }, { "idx": 411, "layers": [ "model.layers.69.self_attn.q_proj" ], "candidates": [ { "dkld": 1.2312526814640956e-05, "dbits": 62914560 }, { "dkld": 1.0861200280487537e-05, "dbits": 125829120 } ] }, { "idx": 412, "layers": [ "model.layers.69.self_attn.k_proj", "model.layers.69.self_attn.v_proj" ], "candidates": [ { "dkld": -2.3868191055952115e-05, "dbits": 10485760 }, { "dkld": -2.5639403611421238e-05, "dbits": 20971520 } ] }, { "idx": 413, "layers": [ "model.layers.69.self_attn.o_proj" ], "candidates": [ { "dkld": 1.5294179320335388e-05, "dbits": 62914560 }, { "dkld": 1.5060603618622867e-05, "dbits": 125829120 } ] }, { "idx": 414, "layers": [ "model.layers.69.mlp.shared_experts.gate_proj", "model.layers.69.mlp.shared_experts.up_proj", "model.layers.69.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 4.057271871715784e-05, "dbits": 23592960 }, { "dkld": 1.704655587673326e-05, "dbits": 47185920 } ] }, { "idx": 415, "layers": [ "model.layers.69.mlp.experts.0.gate_proj", "model.layers.69.mlp.experts.1.gate_proj", "model.layers.69.mlp.experts.2.gate_proj", "model.layers.69.mlp.experts.3.gate_proj", "model.layers.69.mlp.experts.4.gate_proj", "model.layers.69.mlp.experts.5.gate_proj", "model.layers.69.mlp.experts.6.gate_proj", "model.layers.69.mlp.experts.7.gate_proj", "model.layers.69.mlp.experts.8.gate_proj", "model.layers.69.mlp.experts.9.gate_proj", "model.layers.69.mlp.experts.10.gate_proj", "model.layers.69.mlp.experts.11.gate_proj", "model.layers.69.mlp.experts.12.gate_proj", "model.layers.69.mlp.experts.13.gate_proj", "model.layers.69.mlp.experts.14.gate_proj", "model.layers.69.mlp.experts.15.gate_proj", "model.layers.69.mlp.experts.16.gate_proj", "model.layers.69.mlp.experts.17.gate_proj", "model.layers.69.mlp.experts.18.gate_proj", "model.layers.69.mlp.experts.19.gate_proj", "model.layers.69.mlp.experts.20.gate_proj", "model.layers.69.mlp.experts.21.gate_proj", "model.layers.69.mlp.experts.22.gate_proj", "model.layers.69.mlp.experts.23.gate_proj", "model.layers.69.mlp.experts.24.gate_proj", "model.layers.69.mlp.experts.25.gate_proj", "model.layers.69.mlp.experts.26.gate_proj", "model.layers.69.mlp.experts.27.gate_proj", "model.layers.69.mlp.experts.28.gate_proj", "model.layers.69.mlp.experts.29.gate_proj", "model.layers.69.mlp.experts.30.gate_proj", "model.layers.69.mlp.experts.31.gate_proj", "model.layers.69.mlp.experts.32.gate_proj", "model.layers.69.mlp.experts.33.gate_proj", "model.layers.69.mlp.experts.34.gate_proj", "model.layers.69.mlp.experts.35.gate_proj", "model.layers.69.mlp.experts.36.gate_proj", "model.layers.69.mlp.experts.37.gate_proj", "model.layers.69.mlp.experts.38.gate_proj", "model.layers.69.mlp.experts.39.gate_proj", "model.layers.69.mlp.experts.40.gate_proj", "model.layers.69.mlp.experts.41.gate_proj", "model.layers.69.mlp.experts.42.gate_proj", "model.layers.69.mlp.experts.43.gate_proj", "model.layers.69.mlp.experts.44.gate_proj", "model.layers.69.mlp.experts.45.gate_proj", "model.layers.69.mlp.experts.46.gate_proj", "model.layers.69.mlp.experts.47.gate_proj", "model.layers.69.mlp.experts.48.gate_proj", "model.layers.69.mlp.experts.49.gate_proj", "model.layers.69.mlp.experts.50.gate_proj", "model.layers.69.mlp.experts.51.gate_proj", "model.layers.69.mlp.experts.52.gate_proj", "model.layers.69.mlp.experts.53.gate_proj", "model.layers.69.mlp.experts.54.gate_proj", "model.layers.69.mlp.experts.55.gate_proj", "model.layers.69.mlp.experts.56.gate_proj", "model.layers.69.mlp.experts.57.gate_proj", "model.layers.69.mlp.experts.58.gate_proj", "model.layers.69.mlp.experts.59.gate_proj", "model.layers.69.mlp.experts.60.gate_proj", "model.layers.69.mlp.experts.61.gate_proj", "model.layers.69.mlp.experts.62.gate_proj", "model.layers.69.mlp.experts.63.gate_proj", "model.layers.69.mlp.experts.64.gate_proj", "model.layers.69.mlp.experts.65.gate_proj", "model.layers.69.mlp.experts.66.gate_proj", "model.layers.69.mlp.experts.67.gate_proj", "model.layers.69.mlp.experts.68.gate_proj", "model.layers.69.mlp.experts.69.gate_proj", "model.layers.69.mlp.experts.70.gate_proj", "model.layers.69.mlp.experts.71.gate_proj", "model.layers.69.mlp.experts.72.gate_proj", "model.layers.69.mlp.experts.73.gate_proj", "model.layers.69.mlp.experts.74.gate_proj", "model.layers.69.mlp.experts.75.gate_proj", "model.layers.69.mlp.experts.76.gate_proj", "model.layers.69.mlp.experts.77.gate_proj", "model.layers.69.mlp.experts.78.gate_proj", "model.layers.69.mlp.experts.79.gate_proj", "model.layers.69.mlp.experts.80.gate_proj", "model.layers.69.mlp.experts.81.gate_proj", "model.layers.69.mlp.experts.82.gate_proj", "model.layers.69.mlp.experts.83.gate_proj", "model.layers.69.mlp.experts.84.gate_proj", "model.layers.69.mlp.experts.85.gate_proj", "model.layers.69.mlp.experts.86.gate_proj", "model.layers.69.mlp.experts.87.gate_proj", "model.layers.69.mlp.experts.88.gate_proj", "model.layers.69.mlp.experts.89.gate_proj", "model.layers.69.mlp.experts.90.gate_proj", "model.layers.69.mlp.experts.91.gate_proj", "model.layers.69.mlp.experts.92.gate_proj", "model.layers.69.mlp.experts.93.gate_proj", "model.layers.69.mlp.experts.94.gate_proj", "model.layers.69.mlp.experts.95.gate_proj", "model.layers.69.mlp.experts.96.gate_proj", "model.layers.69.mlp.experts.97.gate_proj", "model.layers.69.mlp.experts.98.gate_proj", "model.layers.69.mlp.experts.99.gate_proj", "model.layers.69.mlp.experts.100.gate_proj", "model.layers.69.mlp.experts.101.gate_proj", "model.layers.69.mlp.experts.102.gate_proj", "model.layers.69.mlp.experts.103.gate_proj", "model.layers.69.mlp.experts.104.gate_proj", "model.layers.69.mlp.experts.105.gate_proj", "model.layers.69.mlp.experts.106.gate_proj", "model.layers.69.mlp.experts.107.gate_proj", "model.layers.69.mlp.experts.108.gate_proj", "model.layers.69.mlp.experts.109.gate_proj", "model.layers.69.mlp.experts.110.gate_proj", "model.layers.69.mlp.experts.111.gate_proj", "model.layers.69.mlp.experts.112.gate_proj", "model.layers.69.mlp.experts.113.gate_proj", "model.layers.69.mlp.experts.114.gate_proj", "model.layers.69.mlp.experts.115.gate_proj", "model.layers.69.mlp.experts.116.gate_proj", "model.layers.69.mlp.experts.117.gate_proj", "model.layers.69.mlp.experts.118.gate_proj", "model.layers.69.mlp.experts.119.gate_proj", "model.layers.69.mlp.experts.120.gate_proj", "model.layers.69.mlp.experts.121.gate_proj", "model.layers.69.mlp.experts.122.gate_proj", "model.layers.69.mlp.experts.123.gate_proj", "model.layers.69.mlp.experts.124.gate_proj", "model.layers.69.mlp.experts.125.gate_proj", "model.layers.69.mlp.experts.126.gate_proj", "model.layers.69.mlp.experts.127.gate_proj", "model.layers.69.mlp.experts.128.gate_proj", "model.layers.69.mlp.experts.129.gate_proj", "model.layers.69.mlp.experts.130.gate_proj", "model.layers.69.mlp.experts.131.gate_proj", "model.layers.69.mlp.experts.132.gate_proj", "model.layers.69.mlp.experts.133.gate_proj", "model.layers.69.mlp.experts.134.gate_proj", "model.layers.69.mlp.experts.135.gate_proj", "model.layers.69.mlp.experts.136.gate_proj", "model.layers.69.mlp.experts.137.gate_proj", "model.layers.69.mlp.experts.138.gate_proj", "model.layers.69.mlp.experts.139.gate_proj", "model.layers.69.mlp.experts.140.gate_proj", "model.layers.69.mlp.experts.141.gate_proj", "model.layers.69.mlp.experts.142.gate_proj", "model.layers.69.mlp.experts.143.gate_proj", "model.layers.69.mlp.experts.144.gate_proj", "model.layers.69.mlp.experts.145.gate_proj", "model.layers.69.mlp.experts.146.gate_proj", "model.layers.69.mlp.experts.147.gate_proj", "model.layers.69.mlp.experts.148.gate_proj", "model.layers.69.mlp.experts.149.gate_proj", "model.layers.69.mlp.experts.150.gate_proj", "model.layers.69.mlp.experts.151.gate_proj", "model.layers.69.mlp.experts.152.gate_proj", "model.layers.69.mlp.experts.153.gate_proj", "model.layers.69.mlp.experts.154.gate_proj", "model.layers.69.mlp.experts.155.gate_proj", "model.layers.69.mlp.experts.156.gate_proj", "model.layers.69.mlp.experts.157.gate_proj", "model.layers.69.mlp.experts.158.gate_proj", "model.layers.69.mlp.experts.159.gate_proj", "model.layers.69.mlp.experts.0.up_proj", "model.layers.69.mlp.experts.1.up_proj", "model.layers.69.mlp.experts.2.up_proj", "model.layers.69.mlp.experts.3.up_proj", "model.layers.69.mlp.experts.4.up_proj", "model.layers.69.mlp.experts.5.up_proj", "model.layers.69.mlp.experts.6.up_proj", "model.layers.69.mlp.experts.7.up_proj", "model.layers.69.mlp.experts.8.up_proj", "model.layers.69.mlp.experts.9.up_proj", "model.layers.69.mlp.experts.10.up_proj", "model.layers.69.mlp.experts.11.up_proj", "model.layers.69.mlp.experts.12.up_proj", "model.layers.69.mlp.experts.13.up_proj", "model.layers.69.mlp.experts.14.up_proj", "model.layers.69.mlp.experts.15.up_proj", "model.layers.69.mlp.experts.16.up_proj", "model.layers.69.mlp.experts.17.up_proj", "model.layers.69.mlp.experts.18.up_proj", "model.layers.69.mlp.experts.19.up_proj", "model.layers.69.mlp.experts.20.up_proj", "model.layers.69.mlp.experts.21.up_proj", "model.layers.69.mlp.experts.22.up_proj", "model.layers.69.mlp.experts.23.up_proj", "model.layers.69.mlp.experts.24.up_proj", "model.layers.69.mlp.experts.25.up_proj", "model.layers.69.mlp.experts.26.up_proj", "model.layers.69.mlp.experts.27.up_proj", "model.layers.69.mlp.experts.28.up_proj", "model.layers.69.mlp.experts.29.up_proj", "model.layers.69.mlp.experts.30.up_proj", "model.layers.69.mlp.experts.31.up_proj", "model.layers.69.mlp.experts.32.up_proj", "model.layers.69.mlp.experts.33.up_proj", "model.layers.69.mlp.experts.34.up_proj", "model.layers.69.mlp.experts.35.up_proj", "model.layers.69.mlp.experts.36.up_proj", "model.layers.69.mlp.experts.37.up_proj", "model.layers.69.mlp.experts.38.up_proj", "model.layers.69.mlp.experts.39.up_proj", "model.layers.69.mlp.experts.40.up_proj", "model.layers.69.mlp.experts.41.up_proj", "model.layers.69.mlp.experts.42.up_proj", "model.layers.69.mlp.experts.43.up_proj", "model.layers.69.mlp.experts.44.up_proj", "model.layers.69.mlp.experts.45.up_proj", "model.layers.69.mlp.experts.46.up_proj", "model.layers.69.mlp.experts.47.up_proj", "model.layers.69.mlp.experts.48.up_proj", "model.layers.69.mlp.experts.49.up_proj", "model.layers.69.mlp.experts.50.up_proj", "model.layers.69.mlp.experts.51.up_proj", "model.layers.69.mlp.experts.52.up_proj", "model.layers.69.mlp.experts.53.up_proj", "model.layers.69.mlp.experts.54.up_proj", "model.layers.69.mlp.experts.55.up_proj", "model.layers.69.mlp.experts.56.up_proj", "model.layers.69.mlp.experts.57.up_proj", "model.layers.69.mlp.experts.58.up_proj", "model.layers.69.mlp.experts.59.up_proj", "model.layers.69.mlp.experts.60.up_proj", "model.layers.69.mlp.experts.61.up_proj", "model.layers.69.mlp.experts.62.up_proj", "model.layers.69.mlp.experts.63.up_proj", "model.layers.69.mlp.experts.64.up_proj", "model.layers.69.mlp.experts.65.up_proj", "model.layers.69.mlp.experts.66.up_proj", "model.layers.69.mlp.experts.67.up_proj", "model.layers.69.mlp.experts.68.up_proj", "model.layers.69.mlp.experts.69.up_proj", "model.layers.69.mlp.experts.70.up_proj", "model.layers.69.mlp.experts.71.up_proj", "model.layers.69.mlp.experts.72.up_proj", "model.layers.69.mlp.experts.73.up_proj", "model.layers.69.mlp.experts.74.up_proj", "model.layers.69.mlp.experts.75.up_proj", "model.layers.69.mlp.experts.76.up_proj", "model.layers.69.mlp.experts.77.up_proj", "model.layers.69.mlp.experts.78.up_proj", "model.layers.69.mlp.experts.79.up_proj", "model.layers.69.mlp.experts.80.up_proj", "model.layers.69.mlp.experts.81.up_proj", "model.layers.69.mlp.experts.82.up_proj", "model.layers.69.mlp.experts.83.up_proj", "model.layers.69.mlp.experts.84.up_proj", "model.layers.69.mlp.experts.85.up_proj", "model.layers.69.mlp.experts.86.up_proj", "model.layers.69.mlp.experts.87.up_proj", "model.layers.69.mlp.experts.88.up_proj", "model.layers.69.mlp.experts.89.up_proj", "model.layers.69.mlp.experts.90.up_proj", "model.layers.69.mlp.experts.91.up_proj", "model.layers.69.mlp.experts.92.up_proj", "model.layers.69.mlp.experts.93.up_proj", "model.layers.69.mlp.experts.94.up_proj", "model.layers.69.mlp.experts.95.up_proj", "model.layers.69.mlp.experts.96.up_proj", "model.layers.69.mlp.experts.97.up_proj", "model.layers.69.mlp.experts.98.up_proj", "model.layers.69.mlp.experts.99.up_proj", "model.layers.69.mlp.experts.100.up_proj", "model.layers.69.mlp.experts.101.up_proj", "model.layers.69.mlp.experts.102.up_proj", "model.layers.69.mlp.experts.103.up_proj", "model.layers.69.mlp.experts.104.up_proj", "model.layers.69.mlp.experts.105.up_proj", "model.layers.69.mlp.experts.106.up_proj", "model.layers.69.mlp.experts.107.up_proj", "model.layers.69.mlp.experts.108.up_proj", "model.layers.69.mlp.experts.109.up_proj", "model.layers.69.mlp.experts.110.up_proj", "model.layers.69.mlp.experts.111.up_proj", "model.layers.69.mlp.experts.112.up_proj", "model.layers.69.mlp.experts.113.up_proj", "model.layers.69.mlp.experts.114.up_proj", "model.layers.69.mlp.experts.115.up_proj", "model.layers.69.mlp.experts.116.up_proj", "model.layers.69.mlp.experts.117.up_proj", "model.layers.69.mlp.experts.118.up_proj", "model.layers.69.mlp.experts.119.up_proj", "model.layers.69.mlp.experts.120.up_proj", "model.layers.69.mlp.experts.121.up_proj", "model.layers.69.mlp.experts.122.up_proj", "model.layers.69.mlp.experts.123.up_proj", "model.layers.69.mlp.experts.124.up_proj", "model.layers.69.mlp.experts.125.up_proj", "model.layers.69.mlp.experts.126.up_proj", "model.layers.69.mlp.experts.127.up_proj", "model.layers.69.mlp.experts.128.up_proj", "model.layers.69.mlp.experts.129.up_proj", "model.layers.69.mlp.experts.130.up_proj", "model.layers.69.mlp.experts.131.up_proj", "model.layers.69.mlp.experts.132.up_proj", "model.layers.69.mlp.experts.133.up_proj", "model.layers.69.mlp.experts.134.up_proj", "model.layers.69.mlp.experts.135.up_proj", "model.layers.69.mlp.experts.136.up_proj", "model.layers.69.mlp.experts.137.up_proj", "model.layers.69.mlp.experts.138.up_proj", "model.layers.69.mlp.experts.139.up_proj", "model.layers.69.mlp.experts.140.up_proj", "model.layers.69.mlp.experts.141.up_proj", "model.layers.69.mlp.experts.142.up_proj", "model.layers.69.mlp.experts.143.up_proj", "model.layers.69.mlp.experts.144.up_proj", "model.layers.69.mlp.experts.145.up_proj", "model.layers.69.mlp.experts.146.up_proj", "model.layers.69.mlp.experts.147.up_proj", "model.layers.69.mlp.experts.148.up_proj", "model.layers.69.mlp.experts.149.up_proj", "model.layers.69.mlp.experts.150.up_proj", "model.layers.69.mlp.experts.151.up_proj", "model.layers.69.mlp.experts.152.up_proj", "model.layers.69.mlp.experts.153.up_proj", "model.layers.69.mlp.experts.154.up_proj", "model.layers.69.mlp.experts.155.up_proj", "model.layers.69.mlp.experts.156.up_proj", "model.layers.69.mlp.experts.157.up_proj", "model.layers.69.mlp.experts.158.up_proj", "model.layers.69.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.3713794760405323e-05, "dbits": 2516582400 }, { "dkld": -1.667984761297668e-05, "dbits": 5033164800 } ] }, { "idx": 416, "layers": [ "model.layers.69.mlp.experts.0.down_proj", "model.layers.69.mlp.experts.1.down_proj", "model.layers.69.mlp.experts.2.down_proj", "model.layers.69.mlp.experts.3.down_proj", "model.layers.69.mlp.experts.4.down_proj", "model.layers.69.mlp.experts.5.down_proj", "model.layers.69.mlp.experts.6.down_proj", "model.layers.69.mlp.experts.7.down_proj", "model.layers.69.mlp.experts.8.down_proj", "model.layers.69.mlp.experts.9.down_proj", "model.layers.69.mlp.experts.10.down_proj", "model.layers.69.mlp.experts.11.down_proj", "model.layers.69.mlp.experts.12.down_proj", "model.layers.69.mlp.experts.13.down_proj", "model.layers.69.mlp.experts.14.down_proj", "model.layers.69.mlp.experts.15.down_proj", "model.layers.69.mlp.experts.16.down_proj", "model.layers.69.mlp.experts.17.down_proj", "model.layers.69.mlp.experts.18.down_proj", "model.layers.69.mlp.experts.19.down_proj", "model.layers.69.mlp.experts.20.down_proj", "model.layers.69.mlp.experts.21.down_proj", "model.layers.69.mlp.experts.22.down_proj", "model.layers.69.mlp.experts.23.down_proj", "model.layers.69.mlp.experts.24.down_proj", "model.layers.69.mlp.experts.25.down_proj", "model.layers.69.mlp.experts.26.down_proj", "model.layers.69.mlp.experts.27.down_proj", "model.layers.69.mlp.experts.28.down_proj", "model.layers.69.mlp.experts.29.down_proj", "model.layers.69.mlp.experts.30.down_proj", "model.layers.69.mlp.experts.31.down_proj", "model.layers.69.mlp.experts.32.down_proj", "model.layers.69.mlp.experts.33.down_proj", "model.layers.69.mlp.experts.34.down_proj", "model.layers.69.mlp.experts.35.down_proj", "model.layers.69.mlp.experts.36.down_proj", "model.layers.69.mlp.experts.37.down_proj", "model.layers.69.mlp.experts.38.down_proj", "model.layers.69.mlp.experts.39.down_proj", "model.layers.69.mlp.experts.40.down_proj", "model.layers.69.mlp.experts.41.down_proj", "model.layers.69.mlp.experts.42.down_proj", "model.layers.69.mlp.experts.43.down_proj", "model.layers.69.mlp.experts.44.down_proj", "model.layers.69.mlp.experts.45.down_proj", "model.layers.69.mlp.experts.46.down_proj", "model.layers.69.mlp.experts.47.down_proj", "model.layers.69.mlp.experts.48.down_proj", "model.layers.69.mlp.experts.49.down_proj", "model.layers.69.mlp.experts.50.down_proj", "model.layers.69.mlp.experts.51.down_proj", "model.layers.69.mlp.experts.52.down_proj", "model.layers.69.mlp.experts.53.down_proj", "model.layers.69.mlp.experts.54.down_proj", "model.layers.69.mlp.experts.55.down_proj", "model.layers.69.mlp.experts.56.down_proj", "model.layers.69.mlp.experts.57.down_proj", "model.layers.69.mlp.experts.58.down_proj", "model.layers.69.mlp.experts.59.down_proj", "model.layers.69.mlp.experts.60.down_proj", "model.layers.69.mlp.experts.61.down_proj", "model.layers.69.mlp.experts.62.down_proj", "model.layers.69.mlp.experts.63.down_proj", "model.layers.69.mlp.experts.64.down_proj", "model.layers.69.mlp.experts.65.down_proj", "model.layers.69.mlp.experts.66.down_proj", "model.layers.69.mlp.experts.67.down_proj", "model.layers.69.mlp.experts.68.down_proj", "model.layers.69.mlp.experts.69.down_proj", "model.layers.69.mlp.experts.70.down_proj", "model.layers.69.mlp.experts.71.down_proj", "model.layers.69.mlp.experts.72.down_proj", "model.layers.69.mlp.experts.73.down_proj", "model.layers.69.mlp.experts.74.down_proj", "model.layers.69.mlp.experts.75.down_proj", "model.layers.69.mlp.experts.76.down_proj", "model.layers.69.mlp.experts.77.down_proj", "model.layers.69.mlp.experts.78.down_proj", "model.layers.69.mlp.experts.79.down_proj", "model.layers.69.mlp.experts.80.down_proj", "model.layers.69.mlp.experts.81.down_proj", "model.layers.69.mlp.experts.82.down_proj", "model.layers.69.mlp.experts.83.down_proj", "model.layers.69.mlp.experts.84.down_proj", "model.layers.69.mlp.experts.85.down_proj", "model.layers.69.mlp.experts.86.down_proj", "model.layers.69.mlp.experts.87.down_proj", "model.layers.69.mlp.experts.88.down_proj", "model.layers.69.mlp.experts.89.down_proj", "model.layers.69.mlp.experts.90.down_proj", "model.layers.69.mlp.experts.91.down_proj", "model.layers.69.mlp.experts.92.down_proj", "model.layers.69.mlp.experts.93.down_proj", "model.layers.69.mlp.experts.94.down_proj", "model.layers.69.mlp.experts.95.down_proj", "model.layers.69.mlp.experts.96.down_proj", "model.layers.69.mlp.experts.97.down_proj", "model.layers.69.mlp.experts.98.down_proj", "model.layers.69.mlp.experts.99.down_proj", "model.layers.69.mlp.experts.100.down_proj", "model.layers.69.mlp.experts.101.down_proj", "model.layers.69.mlp.experts.102.down_proj", "model.layers.69.mlp.experts.103.down_proj", "model.layers.69.mlp.experts.104.down_proj", "model.layers.69.mlp.experts.105.down_proj", "model.layers.69.mlp.experts.106.down_proj", "model.layers.69.mlp.experts.107.down_proj", "model.layers.69.mlp.experts.108.down_proj", "model.layers.69.mlp.experts.109.down_proj", "model.layers.69.mlp.experts.110.down_proj", "model.layers.69.mlp.experts.111.down_proj", "model.layers.69.mlp.experts.112.down_proj", "model.layers.69.mlp.experts.113.down_proj", "model.layers.69.mlp.experts.114.down_proj", "model.layers.69.mlp.experts.115.down_proj", "model.layers.69.mlp.experts.116.down_proj", "model.layers.69.mlp.experts.117.down_proj", "model.layers.69.mlp.experts.118.down_proj", "model.layers.69.mlp.experts.119.down_proj", "model.layers.69.mlp.experts.120.down_proj", "model.layers.69.mlp.experts.121.down_proj", "model.layers.69.mlp.experts.122.down_proj", "model.layers.69.mlp.experts.123.down_proj", "model.layers.69.mlp.experts.124.down_proj", "model.layers.69.mlp.experts.125.down_proj", "model.layers.69.mlp.experts.126.down_proj", "model.layers.69.mlp.experts.127.down_proj", "model.layers.69.mlp.experts.128.down_proj", "model.layers.69.mlp.experts.129.down_proj", "model.layers.69.mlp.experts.130.down_proj", "model.layers.69.mlp.experts.131.down_proj", "model.layers.69.mlp.experts.132.down_proj", "model.layers.69.mlp.experts.133.down_proj", "model.layers.69.mlp.experts.134.down_proj", "model.layers.69.mlp.experts.135.down_proj", "model.layers.69.mlp.experts.136.down_proj", "model.layers.69.mlp.experts.137.down_proj", "model.layers.69.mlp.experts.138.down_proj", "model.layers.69.mlp.experts.139.down_proj", "model.layers.69.mlp.experts.140.down_proj", "model.layers.69.mlp.experts.141.down_proj", "model.layers.69.mlp.experts.142.down_proj", "model.layers.69.mlp.experts.143.down_proj", "model.layers.69.mlp.experts.144.down_proj", "model.layers.69.mlp.experts.145.down_proj", "model.layers.69.mlp.experts.146.down_proj", "model.layers.69.mlp.experts.147.down_proj", "model.layers.69.mlp.experts.148.down_proj", "model.layers.69.mlp.experts.149.down_proj", "model.layers.69.mlp.experts.150.down_proj", "model.layers.69.mlp.experts.151.down_proj", "model.layers.69.mlp.experts.152.down_proj", "model.layers.69.mlp.experts.153.down_proj", "model.layers.69.mlp.experts.154.down_proj", "model.layers.69.mlp.experts.155.down_proj", "model.layers.69.mlp.experts.156.down_proj", "model.layers.69.mlp.experts.157.down_proj", "model.layers.69.mlp.experts.158.down_proj", "model.layers.69.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.6135070472954316e-05, "dbits": 1258291200 }, { "dkld": -3.387429751455437e-06, "dbits": 2516582400 } ] }, { "idx": 417, "layers": [ "model.layers.70.self_attn.q_proj" ], "candidates": [ { "dkld": 6.541842594742775e-06, "dbits": 62914560 }, { "dkld": -3.3742049708948563e-06, "dbits": 125829120 } ] }, { "idx": 418, "layers": [ "model.layers.70.self_attn.k_proj", "model.layers.70.self_attn.v_proj" ], "candidates": [ { "dkld": 2.014024648815463e-05, "dbits": 10485760 }, { "dkld": 1.259816344827483e-05, "dbits": 20971520 } ] }, { "idx": 419, "layers": [ "model.layers.70.self_attn.o_proj" ], "candidates": [ { "dkld": -3.905384801328182e-06, "dbits": 62914560 }, { "dkld": -1.4933198690413041e-05, "dbits": 125829120 } ] }, { "idx": 420, "layers": [ "model.layers.70.mlp.shared_experts.gate_proj", "model.layers.70.mlp.shared_experts.up_proj", "model.layers.70.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 2.8971116989851e-06, "dbits": 23592960 }, { "dkld": -1.7635105177759083e-05, "dbits": 47185920 } ] }, { "idx": 421, "layers": [ "model.layers.70.mlp.experts.0.gate_proj", "model.layers.70.mlp.experts.1.gate_proj", "model.layers.70.mlp.experts.2.gate_proj", "model.layers.70.mlp.experts.3.gate_proj", "model.layers.70.mlp.experts.4.gate_proj", "model.layers.70.mlp.experts.5.gate_proj", "model.layers.70.mlp.experts.6.gate_proj", "model.layers.70.mlp.experts.7.gate_proj", "model.layers.70.mlp.experts.8.gate_proj", "model.layers.70.mlp.experts.9.gate_proj", "model.layers.70.mlp.experts.10.gate_proj", "model.layers.70.mlp.experts.11.gate_proj", "model.layers.70.mlp.experts.12.gate_proj", "model.layers.70.mlp.experts.13.gate_proj", "model.layers.70.mlp.experts.14.gate_proj", "model.layers.70.mlp.experts.15.gate_proj", "model.layers.70.mlp.experts.16.gate_proj", "model.layers.70.mlp.experts.17.gate_proj", "model.layers.70.mlp.experts.18.gate_proj", "model.layers.70.mlp.experts.19.gate_proj", "model.layers.70.mlp.experts.20.gate_proj", "model.layers.70.mlp.experts.21.gate_proj", "model.layers.70.mlp.experts.22.gate_proj", "model.layers.70.mlp.experts.23.gate_proj", "model.layers.70.mlp.experts.24.gate_proj", "model.layers.70.mlp.experts.25.gate_proj", "model.layers.70.mlp.experts.26.gate_proj", "model.layers.70.mlp.experts.27.gate_proj", "model.layers.70.mlp.experts.28.gate_proj", "model.layers.70.mlp.experts.29.gate_proj", "model.layers.70.mlp.experts.30.gate_proj", "model.layers.70.mlp.experts.31.gate_proj", "model.layers.70.mlp.experts.32.gate_proj", "model.layers.70.mlp.experts.33.gate_proj", "model.layers.70.mlp.experts.34.gate_proj", "model.layers.70.mlp.experts.35.gate_proj", "model.layers.70.mlp.experts.36.gate_proj", "model.layers.70.mlp.experts.37.gate_proj", "model.layers.70.mlp.experts.38.gate_proj", "model.layers.70.mlp.experts.39.gate_proj", "model.layers.70.mlp.experts.40.gate_proj", "model.layers.70.mlp.experts.41.gate_proj", "model.layers.70.mlp.experts.42.gate_proj", "model.layers.70.mlp.experts.43.gate_proj", "model.layers.70.mlp.experts.44.gate_proj", "model.layers.70.mlp.experts.45.gate_proj", "model.layers.70.mlp.experts.46.gate_proj", "model.layers.70.mlp.experts.47.gate_proj", "model.layers.70.mlp.experts.48.gate_proj", "model.layers.70.mlp.experts.49.gate_proj", "model.layers.70.mlp.experts.50.gate_proj", "model.layers.70.mlp.experts.51.gate_proj", "model.layers.70.mlp.experts.52.gate_proj", "model.layers.70.mlp.experts.53.gate_proj", "model.layers.70.mlp.experts.54.gate_proj", "model.layers.70.mlp.experts.55.gate_proj", "model.layers.70.mlp.experts.56.gate_proj", "model.layers.70.mlp.experts.57.gate_proj", "model.layers.70.mlp.experts.58.gate_proj", "model.layers.70.mlp.experts.59.gate_proj", "model.layers.70.mlp.experts.60.gate_proj", "model.layers.70.mlp.experts.61.gate_proj", "model.layers.70.mlp.experts.62.gate_proj", "model.layers.70.mlp.experts.63.gate_proj", "model.layers.70.mlp.experts.64.gate_proj", "model.layers.70.mlp.experts.65.gate_proj", "model.layers.70.mlp.experts.66.gate_proj", "model.layers.70.mlp.experts.67.gate_proj", "model.layers.70.mlp.experts.68.gate_proj", "model.layers.70.mlp.experts.69.gate_proj", "model.layers.70.mlp.experts.70.gate_proj", "model.layers.70.mlp.experts.71.gate_proj", "model.layers.70.mlp.experts.72.gate_proj", "model.layers.70.mlp.experts.73.gate_proj", "model.layers.70.mlp.experts.74.gate_proj", "model.layers.70.mlp.experts.75.gate_proj", "model.layers.70.mlp.experts.76.gate_proj", "model.layers.70.mlp.experts.77.gate_proj", "model.layers.70.mlp.experts.78.gate_proj", "model.layers.70.mlp.experts.79.gate_proj", "model.layers.70.mlp.experts.80.gate_proj", "model.layers.70.mlp.experts.81.gate_proj", "model.layers.70.mlp.experts.82.gate_proj", "model.layers.70.mlp.experts.83.gate_proj", "model.layers.70.mlp.experts.84.gate_proj", "model.layers.70.mlp.experts.85.gate_proj", "model.layers.70.mlp.experts.86.gate_proj", "model.layers.70.mlp.experts.87.gate_proj", "model.layers.70.mlp.experts.88.gate_proj", "model.layers.70.mlp.experts.89.gate_proj", "model.layers.70.mlp.experts.90.gate_proj", "model.layers.70.mlp.experts.91.gate_proj", "model.layers.70.mlp.experts.92.gate_proj", "model.layers.70.mlp.experts.93.gate_proj", "model.layers.70.mlp.experts.94.gate_proj", "model.layers.70.mlp.experts.95.gate_proj", "model.layers.70.mlp.experts.96.gate_proj", "model.layers.70.mlp.experts.97.gate_proj", "model.layers.70.mlp.experts.98.gate_proj", "model.layers.70.mlp.experts.99.gate_proj", "model.layers.70.mlp.experts.100.gate_proj", "model.layers.70.mlp.experts.101.gate_proj", "model.layers.70.mlp.experts.102.gate_proj", "model.layers.70.mlp.experts.103.gate_proj", "model.layers.70.mlp.experts.104.gate_proj", "model.layers.70.mlp.experts.105.gate_proj", "model.layers.70.mlp.experts.106.gate_proj", "model.layers.70.mlp.experts.107.gate_proj", "model.layers.70.mlp.experts.108.gate_proj", "model.layers.70.mlp.experts.109.gate_proj", "model.layers.70.mlp.experts.110.gate_proj", "model.layers.70.mlp.experts.111.gate_proj", "model.layers.70.mlp.experts.112.gate_proj", "model.layers.70.mlp.experts.113.gate_proj", "model.layers.70.mlp.experts.114.gate_proj", "model.layers.70.mlp.experts.115.gate_proj", "model.layers.70.mlp.experts.116.gate_proj", "model.layers.70.mlp.experts.117.gate_proj", "model.layers.70.mlp.experts.118.gate_proj", "model.layers.70.mlp.experts.119.gate_proj", "model.layers.70.mlp.experts.120.gate_proj", "model.layers.70.mlp.experts.121.gate_proj", "model.layers.70.mlp.experts.122.gate_proj", "model.layers.70.mlp.experts.123.gate_proj", "model.layers.70.mlp.experts.124.gate_proj", "model.layers.70.mlp.experts.125.gate_proj", "model.layers.70.mlp.experts.126.gate_proj", "model.layers.70.mlp.experts.127.gate_proj", "model.layers.70.mlp.experts.128.gate_proj", "model.layers.70.mlp.experts.129.gate_proj", "model.layers.70.mlp.experts.130.gate_proj", "model.layers.70.mlp.experts.131.gate_proj", "model.layers.70.mlp.experts.132.gate_proj", "model.layers.70.mlp.experts.133.gate_proj", "model.layers.70.mlp.experts.134.gate_proj", "model.layers.70.mlp.experts.135.gate_proj", "model.layers.70.mlp.experts.136.gate_proj", "model.layers.70.mlp.experts.137.gate_proj", "model.layers.70.mlp.experts.138.gate_proj", "model.layers.70.mlp.experts.139.gate_proj", "model.layers.70.mlp.experts.140.gate_proj", "model.layers.70.mlp.experts.141.gate_proj", "model.layers.70.mlp.experts.142.gate_proj", "model.layers.70.mlp.experts.143.gate_proj", "model.layers.70.mlp.experts.144.gate_proj", "model.layers.70.mlp.experts.145.gate_proj", "model.layers.70.mlp.experts.146.gate_proj", "model.layers.70.mlp.experts.147.gate_proj", "model.layers.70.mlp.experts.148.gate_proj", "model.layers.70.mlp.experts.149.gate_proj", "model.layers.70.mlp.experts.150.gate_proj", "model.layers.70.mlp.experts.151.gate_proj", "model.layers.70.mlp.experts.152.gate_proj", "model.layers.70.mlp.experts.153.gate_proj", "model.layers.70.mlp.experts.154.gate_proj", "model.layers.70.mlp.experts.155.gate_proj", "model.layers.70.mlp.experts.156.gate_proj", "model.layers.70.mlp.experts.157.gate_proj", "model.layers.70.mlp.experts.158.gate_proj", "model.layers.70.mlp.experts.159.gate_proj", "model.layers.70.mlp.experts.0.up_proj", "model.layers.70.mlp.experts.1.up_proj", "model.layers.70.mlp.experts.2.up_proj", "model.layers.70.mlp.experts.3.up_proj", "model.layers.70.mlp.experts.4.up_proj", "model.layers.70.mlp.experts.5.up_proj", "model.layers.70.mlp.experts.6.up_proj", "model.layers.70.mlp.experts.7.up_proj", "model.layers.70.mlp.experts.8.up_proj", "model.layers.70.mlp.experts.9.up_proj", "model.layers.70.mlp.experts.10.up_proj", "model.layers.70.mlp.experts.11.up_proj", "model.layers.70.mlp.experts.12.up_proj", "model.layers.70.mlp.experts.13.up_proj", "model.layers.70.mlp.experts.14.up_proj", "model.layers.70.mlp.experts.15.up_proj", "model.layers.70.mlp.experts.16.up_proj", "model.layers.70.mlp.experts.17.up_proj", "model.layers.70.mlp.experts.18.up_proj", "model.layers.70.mlp.experts.19.up_proj", "model.layers.70.mlp.experts.20.up_proj", "model.layers.70.mlp.experts.21.up_proj", "model.layers.70.mlp.experts.22.up_proj", "model.layers.70.mlp.experts.23.up_proj", "model.layers.70.mlp.experts.24.up_proj", "model.layers.70.mlp.experts.25.up_proj", "model.layers.70.mlp.experts.26.up_proj", "model.layers.70.mlp.experts.27.up_proj", "model.layers.70.mlp.experts.28.up_proj", "model.layers.70.mlp.experts.29.up_proj", "model.layers.70.mlp.experts.30.up_proj", "model.layers.70.mlp.experts.31.up_proj", "model.layers.70.mlp.experts.32.up_proj", "model.layers.70.mlp.experts.33.up_proj", "model.layers.70.mlp.experts.34.up_proj", "model.layers.70.mlp.experts.35.up_proj", "model.layers.70.mlp.experts.36.up_proj", "model.layers.70.mlp.experts.37.up_proj", "model.layers.70.mlp.experts.38.up_proj", "model.layers.70.mlp.experts.39.up_proj", "model.layers.70.mlp.experts.40.up_proj", "model.layers.70.mlp.experts.41.up_proj", "model.layers.70.mlp.experts.42.up_proj", "model.layers.70.mlp.experts.43.up_proj", "model.layers.70.mlp.experts.44.up_proj", "model.layers.70.mlp.experts.45.up_proj", "model.layers.70.mlp.experts.46.up_proj", "model.layers.70.mlp.experts.47.up_proj", "model.layers.70.mlp.experts.48.up_proj", "model.layers.70.mlp.experts.49.up_proj", "model.layers.70.mlp.experts.50.up_proj", "model.layers.70.mlp.experts.51.up_proj", "model.layers.70.mlp.experts.52.up_proj", "model.layers.70.mlp.experts.53.up_proj", "model.layers.70.mlp.experts.54.up_proj", "model.layers.70.mlp.experts.55.up_proj", "model.layers.70.mlp.experts.56.up_proj", "model.layers.70.mlp.experts.57.up_proj", "model.layers.70.mlp.experts.58.up_proj", "model.layers.70.mlp.experts.59.up_proj", "model.layers.70.mlp.experts.60.up_proj", "model.layers.70.mlp.experts.61.up_proj", "model.layers.70.mlp.experts.62.up_proj", "model.layers.70.mlp.experts.63.up_proj", "model.layers.70.mlp.experts.64.up_proj", "model.layers.70.mlp.experts.65.up_proj", "model.layers.70.mlp.experts.66.up_proj", "model.layers.70.mlp.experts.67.up_proj", "model.layers.70.mlp.experts.68.up_proj", "model.layers.70.mlp.experts.69.up_proj", "model.layers.70.mlp.experts.70.up_proj", "model.layers.70.mlp.experts.71.up_proj", "model.layers.70.mlp.experts.72.up_proj", "model.layers.70.mlp.experts.73.up_proj", "model.layers.70.mlp.experts.74.up_proj", "model.layers.70.mlp.experts.75.up_proj", "model.layers.70.mlp.experts.76.up_proj", "model.layers.70.mlp.experts.77.up_proj", "model.layers.70.mlp.experts.78.up_proj", "model.layers.70.mlp.experts.79.up_proj", "model.layers.70.mlp.experts.80.up_proj", "model.layers.70.mlp.experts.81.up_proj", "model.layers.70.mlp.experts.82.up_proj", "model.layers.70.mlp.experts.83.up_proj", "model.layers.70.mlp.experts.84.up_proj", "model.layers.70.mlp.experts.85.up_proj", "model.layers.70.mlp.experts.86.up_proj", "model.layers.70.mlp.experts.87.up_proj", "model.layers.70.mlp.experts.88.up_proj", "model.layers.70.mlp.experts.89.up_proj", "model.layers.70.mlp.experts.90.up_proj", "model.layers.70.mlp.experts.91.up_proj", "model.layers.70.mlp.experts.92.up_proj", "model.layers.70.mlp.experts.93.up_proj", "model.layers.70.mlp.experts.94.up_proj", "model.layers.70.mlp.experts.95.up_proj", "model.layers.70.mlp.experts.96.up_proj", "model.layers.70.mlp.experts.97.up_proj", "model.layers.70.mlp.experts.98.up_proj", "model.layers.70.mlp.experts.99.up_proj", "model.layers.70.mlp.experts.100.up_proj", "model.layers.70.mlp.experts.101.up_proj", "model.layers.70.mlp.experts.102.up_proj", "model.layers.70.mlp.experts.103.up_proj", "model.layers.70.mlp.experts.104.up_proj", "model.layers.70.mlp.experts.105.up_proj", "model.layers.70.mlp.experts.106.up_proj", "model.layers.70.mlp.experts.107.up_proj", "model.layers.70.mlp.experts.108.up_proj", "model.layers.70.mlp.experts.109.up_proj", "model.layers.70.mlp.experts.110.up_proj", "model.layers.70.mlp.experts.111.up_proj", "model.layers.70.mlp.experts.112.up_proj", "model.layers.70.mlp.experts.113.up_proj", "model.layers.70.mlp.experts.114.up_proj", "model.layers.70.mlp.experts.115.up_proj", "model.layers.70.mlp.experts.116.up_proj", "model.layers.70.mlp.experts.117.up_proj", "model.layers.70.mlp.experts.118.up_proj", "model.layers.70.mlp.experts.119.up_proj", "model.layers.70.mlp.experts.120.up_proj", "model.layers.70.mlp.experts.121.up_proj", "model.layers.70.mlp.experts.122.up_proj", "model.layers.70.mlp.experts.123.up_proj", "model.layers.70.mlp.experts.124.up_proj", "model.layers.70.mlp.experts.125.up_proj", "model.layers.70.mlp.experts.126.up_proj", "model.layers.70.mlp.experts.127.up_proj", "model.layers.70.mlp.experts.128.up_proj", "model.layers.70.mlp.experts.129.up_proj", "model.layers.70.mlp.experts.130.up_proj", "model.layers.70.mlp.experts.131.up_proj", "model.layers.70.mlp.experts.132.up_proj", "model.layers.70.mlp.experts.133.up_proj", "model.layers.70.mlp.experts.134.up_proj", "model.layers.70.mlp.experts.135.up_proj", "model.layers.70.mlp.experts.136.up_proj", "model.layers.70.mlp.experts.137.up_proj", "model.layers.70.mlp.experts.138.up_proj", "model.layers.70.mlp.experts.139.up_proj", "model.layers.70.mlp.experts.140.up_proj", "model.layers.70.mlp.experts.141.up_proj", "model.layers.70.mlp.experts.142.up_proj", "model.layers.70.mlp.experts.143.up_proj", "model.layers.70.mlp.experts.144.up_proj", "model.layers.70.mlp.experts.145.up_proj", "model.layers.70.mlp.experts.146.up_proj", "model.layers.70.mlp.experts.147.up_proj", "model.layers.70.mlp.experts.148.up_proj", "model.layers.70.mlp.experts.149.up_proj", "model.layers.70.mlp.experts.150.up_proj", "model.layers.70.mlp.experts.151.up_proj", "model.layers.70.mlp.experts.152.up_proj", "model.layers.70.mlp.experts.153.up_proj", "model.layers.70.mlp.experts.154.up_proj", "model.layers.70.mlp.experts.155.up_proj", "model.layers.70.mlp.experts.156.up_proj", "model.layers.70.mlp.experts.157.up_proj", "model.layers.70.mlp.experts.158.up_proj", "model.layers.70.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 6.318138912320831e-06, "dbits": 2516582400 }, { "dkld": -3.5071279853512993e-07, "dbits": 5033164800 } ] }, { "idx": 422, "layers": [ "model.layers.70.mlp.experts.0.down_proj", "model.layers.70.mlp.experts.1.down_proj", "model.layers.70.mlp.experts.2.down_proj", "model.layers.70.mlp.experts.3.down_proj", "model.layers.70.mlp.experts.4.down_proj", "model.layers.70.mlp.experts.5.down_proj", "model.layers.70.mlp.experts.6.down_proj", "model.layers.70.mlp.experts.7.down_proj", "model.layers.70.mlp.experts.8.down_proj", "model.layers.70.mlp.experts.9.down_proj", "model.layers.70.mlp.experts.10.down_proj", "model.layers.70.mlp.experts.11.down_proj", "model.layers.70.mlp.experts.12.down_proj", "model.layers.70.mlp.experts.13.down_proj", "model.layers.70.mlp.experts.14.down_proj", "model.layers.70.mlp.experts.15.down_proj", "model.layers.70.mlp.experts.16.down_proj", "model.layers.70.mlp.experts.17.down_proj", "model.layers.70.mlp.experts.18.down_proj", "model.layers.70.mlp.experts.19.down_proj", "model.layers.70.mlp.experts.20.down_proj", "model.layers.70.mlp.experts.21.down_proj", "model.layers.70.mlp.experts.22.down_proj", "model.layers.70.mlp.experts.23.down_proj", "model.layers.70.mlp.experts.24.down_proj", "model.layers.70.mlp.experts.25.down_proj", "model.layers.70.mlp.experts.26.down_proj", "model.layers.70.mlp.experts.27.down_proj", "model.layers.70.mlp.experts.28.down_proj", "model.layers.70.mlp.experts.29.down_proj", "model.layers.70.mlp.experts.30.down_proj", "model.layers.70.mlp.experts.31.down_proj", "model.layers.70.mlp.experts.32.down_proj", "model.layers.70.mlp.experts.33.down_proj", "model.layers.70.mlp.experts.34.down_proj", "model.layers.70.mlp.experts.35.down_proj", "model.layers.70.mlp.experts.36.down_proj", "model.layers.70.mlp.experts.37.down_proj", "model.layers.70.mlp.experts.38.down_proj", "model.layers.70.mlp.experts.39.down_proj", "model.layers.70.mlp.experts.40.down_proj", "model.layers.70.mlp.experts.41.down_proj", "model.layers.70.mlp.experts.42.down_proj", "model.layers.70.mlp.experts.43.down_proj", "model.layers.70.mlp.experts.44.down_proj", "model.layers.70.mlp.experts.45.down_proj", "model.layers.70.mlp.experts.46.down_proj", "model.layers.70.mlp.experts.47.down_proj", "model.layers.70.mlp.experts.48.down_proj", "model.layers.70.mlp.experts.49.down_proj", "model.layers.70.mlp.experts.50.down_proj", "model.layers.70.mlp.experts.51.down_proj", "model.layers.70.mlp.experts.52.down_proj", "model.layers.70.mlp.experts.53.down_proj", "model.layers.70.mlp.experts.54.down_proj", "model.layers.70.mlp.experts.55.down_proj", "model.layers.70.mlp.experts.56.down_proj", "model.layers.70.mlp.experts.57.down_proj", "model.layers.70.mlp.experts.58.down_proj", "model.layers.70.mlp.experts.59.down_proj", "model.layers.70.mlp.experts.60.down_proj", "model.layers.70.mlp.experts.61.down_proj", "model.layers.70.mlp.experts.62.down_proj", "model.layers.70.mlp.experts.63.down_proj", "model.layers.70.mlp.experts.64.down_proj", "model.layers.70.mlp.experts.65.down_proj", "model.layers.70.mlp.experts.66.down_proj", "model.layers.70.mlp.experts.67.down_proj", "model.layers.70.mlp.experts.68.down_proj", "model.layers.70.mlp.experts.69.down_proj", "model.layers.70.mlp.experts.70.down_proj", "model.layers.70.mlp.experts.71.down_proj", "model.layers.70.mlp.experts.72.down_proj", "model.layers.70.mlp.experts.73.down_proj", "model.layers.70.mlp.experts.74.down_proj", "model.layers.70.mlp.experts.75.down_proj", "model.layers.70.mlp.experts.76.down_proj", "model.layers.70.mlp.experts.77.down_proj", "model.layers.70.mlp.experts.78.down_proj", "model.layers.70.mlp.experts.79.down_proj", "model.layers.70.mlp.experts.80.down_proj", "model.layers.70.mlp.experts.81.down_proj", "model.layers.70.mlp.experts.82.down_proj", "model.layers.70.mlp.experts.83.down_proj", "model.layers.70.mlp.experts.84.down_proj", "model.layers.70.mlp.experts.85.down_proj", "model.layers.70.mlp.experts.86.down_proj", "model.layers.70.mlp.experts.87.down_proj", "model.layers.70.mlp.experts.88.down_proj", "model.layers.70.mlp.experts.89.down_proj", "model.layers.70.mlp.experts.90.down_proj", "model.layers.70.mlp.experts.91.down_proj", "model.layers.70.mlp.experts.92.down_proj", "model.layers.70.mlp.experts.93.down_proj", "model.layers.70.mlp.experts.94.down_proj", "model.layers.70.mlp.experts.95.down_proj", "model.layers.70.mlp.experts.96.down_proj", "model.layers.70.mlp.experts.97.down_proj", "model.layers.70.mlp.experts.98.down_proj", "model.layers.70.mlp.experts.99.down_proj", "model.layers.70.mlp.experts.100.down_proj", "model.layers.70.mlp.experts.101.down_proj", "model.layers.70.mlp.experts.102.down_proj", "model.layers.70.mlp.experts.103.down_proj", "model.layers.70.mlp.experts.104.down_proj", "model.layers.70.mlp.experts.105.down_proj", "model.layers.70.mlp.experts.106.down_proj", "model.layers.70.mlp.experts.107.down_proj", "model.layers.70.mlp.experts.108.down_proj", "model.layers.70.mlp.experts.109.down_proj", "model.layers.70.mlp.experts.110.down_proj", "model.layers.70.mlp.experts.111.down_proj", "model.layers.70.mlp.experts.112.down_proj", "model.layers.70.mlp.experts.113.down_proj", "model.layers.70.mlp.experts.114.down_proj", "model.layers.70.mlp.experts.115.down_proj", "model.layers.70.mlp.experts.116.down_proj", "model.layers.70.mlp.experts.117.down_proj", "model.layers.70.mlp.experts.118.down_proj", "model.layers.70.mlp.experts.119.down_proj", "model.layers.70.mlp.experts.120.down_proj", "model.layers.70.mlp.experts.121.down_proj", "model.layers.70.mlp.experts.122.down_proj", "model.layers.70.mlp.experts.123.down_proj", "model.layers.70.mlp.experts.124.down_proj", "model.layers.70.mlp.experts.125.down_proj", "model.layers.70.mlp.experts.126.down_proj", "model.layers.70.mlp.experts.127.down_proj", "model.layers.70.mlp.experts.128.down_proj", "model.layers.70.mlp.experts.129.down_proj", "model.layers.70.mlp.experts.130.down_proj", "model.layers.70.mlp.experts.131.down_proj", "model.layers.70.mlp.experts.132.down_proj", "model.layers.70.mlp.experts.133.down_proj", "model.layers.70.mlp.experts.134.down_proj", "model.layers.70.mlp.experts.135.down_proj", "model.layers.70.mlp.experts.136.down_proj", "model.layers.70.mlp.experts.137.down_proj", "model.layers.70.mlp.experts.138.down_proj", "model.layers.70.mlp.experts.139.down_proj", "model.layers.70.mlp.experts.140.down_proj", "model.layers.70.mlp.experts.141.down_proj", "model.layers.70.mlp.experts.142.down_proj", "model.layers.70.mlp.experts.143.down_proj", "model.layers.70.mlp.experts.144.down_proj", "model.layers.70.mlp.experts.145.down_proj", "model.layers.70.mlp.experts.146.down_proj", "model.layers.70.mlp.experts.147.down_proj", "model.layers.70.mlp.experts.148.down_proj", "model.layers.70.mlp.experts.149.down_proj", "model.layers.70.mlp.experts.150.down_proj", "model.layers.70.mlp.experts.151.down_proj", "model.layers.70.mlp.experts.152.down_proj", "model.layers.70.mlp.experts.153.down_proj", "model.layers.70.mlp.experts.154.down_proj", "model.layers.70.mlp.experts.155.down_proj", "model.layers.70.mlp.experts.156.down_proj", "model.layers.70.mlp.experts.157.down_proj", "model.layers.70.mlp.experts.158.down_proj", "model.layers.70.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -8.275872096417947e-06, "dbits": 1258291200 }, { "dkld": -1.4105997979640267e-05, "dbits": 2516582400 } ] }, { "idx": 423, "layers": [ "model.layers.71.self_attn.q_proj" ], "candidates": [ { "dkld": 3.19187063723813e-05, "dbits": 62914560 }, { "dkld": 3.415867686271806e-05, "dbits": 125829120 } ] }, { "idx": 424, "layers": [ "model.layers.71.self_attn.k_proj", "model.layers.71.self_attn.v_proj" ], "candidates": [ { "dkld": 1.5099439769983639e-05, "dbits": 10485760 }, { "dkld": -1.03986356407397e-05, "dbits": 20971520 } ] }, { "idx": 425, "layers": [ "model.layers.71.self_attn.o_proj" ], "candidates": [ { "dkld": -5.686702206729802e-06, "dbits": 62914560 }, { "dkld": -1.6122800298034798e-05, "dbits": 125829120 } ] }, { "idx": 426, "layers": [ "model.layers.71.mlp.shared_experts.gate_proj", "model.layers.71.mlp.shared_experts.up_proj", "model.layers.71.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.279571585357085e-05, "dbits": 23592960 }, { "dkld": -3.839742857962743e-05, "dbits": 47185920 } ] }, { "idx": 427, "layers": [ "model.layers.71.mlp.experts.0.gate_proj", "model.layers.71.mlp.experts.1.gate_proj", "model.layers.71.mlp.experts.2.gate_proj", "model.layers.71.mlp.experts.3.gate_proj", "model.layers.71.mlp.experts.4.gate_proj", "model.layers.71.mlp.experts.5.gate_proj", "model.layers.71.mlp.experts.6.gate_proj", "model.layers.71.mlp.experts.7.gate_proj", "model.layers.71.mlp.experts.8.gate_proj", "model.layers.71.mlp.experts.9.gate_proj", "model.layers.71.mlp.experts.10.gate_proj", "model.layers.71.mlp.experts.11.gate_proj", "model.layers.71.mlp.experts.12.gate_proj", "model.layers.71.mlp.experts.13.gate_proj", "model.layers.71.mlp.experts.14.gate_proj", "model.layers.71.mlp.experts.15.gate_proj", "model.layers.71.mlp.experts.16.gate_proj", "model.layers.71.mlp.experts.17.gate_proj", "model.layers.71.mlp.experts.18.gate_proj", "model.layers.71.mlp.experts.19.gate_proj", "model.layers.71.mlp.experts.20.gate_proj", "model.layers.71.mlp.experts.21.gate_proj", "model.layers.71.mlp.experts.22.gate_proj", "model.layers.71.mlp.experts.23.gate_proj", "model.layers.71.mlp.experts.24.gate_proj", "model.layers.71.mlp.experts.25.gate_proj", "model.layers.71.mlp.experts.26.gate_proj", "model.layers.71.mlp.experts.27.gate_proj", "model.layers.71.mlp.experts.28.gate_proj", "model.layers.71.mlp.experts.29.gate_proj", "model.layers.71.mlp.experts.30.gate_proj", "model.layers.71.mlp.experts.31.gate_proj", "model.layers.71.mlp.experts.32.gate_proj", "model.layers.71.mlp.experts.33.gate_proj", "model.layers.71.mlp.experts.34.gate_proj", "model.layers.71.mlp.experts.35.gate_proj", "model.layers.71.mlp.experts.36.gate_proj", "model.layers.71.mlp.experts.37.gate_proj", "model.layers.71.mlp.experts.38.gate_proj", "model.layers.71.mlp.experts.39.gate_proj", "model.layers.71.mlp.experts.40.gate_proj", "model.layers.71.mlp.experts.41.gate_proj", "model.layers.71.mlp.experts.42.gate_proj", "model.layers.71.mlp.experts.43.gate_proj", "model.layers.71.mlp.experts.44.gate_proj", "model.layers.71.mlp.experts.45.gate_proj", "model.layers.71.mlp.experts.46.gate_proj", "model.layers.71.mlp.experts.47.gate_proj", "model.layers.71.mlp.experts.48.gate_proj", "model.layers.71.mlp.experts.49.gate_proj", "model.layers.71.mlp.experts.50.gate_proj", "model.layers.71.mlp.experts.51.gate_proj", "model.layers.71.mlp.experts.52.gate_proj", "model.layers.71.mlp.experts.53.gate_proj", "model.layers.71.mlp.experts.54.gate_proj", "model.layers.71.mlp.experts.55.gate_proj", "model.layers.71.mlp.experts.56.gate_proj", "model.layers.71.mlp.experts.57.gate_proj", "model.layers.71.mlp.experts.58.gate_proj", "model.layers.71.mlp.experts.59.gate_proj", "model.layers.71.mlp.experts.60.gate_proj", "model.layers.71.mlp.experts.61.gate_proj", "model.layers.71.mlp.experts.62.gate_proj", "model.layers.71.mlp.experts.63.gate_proj", "model.layers.71.mlp.experts.64.gate_proj", "model.layers.71.mlp.experts.65.gate_proj", "model.layers.71.mlp.experts.66.gate_proj", "model.layers.71.mlp.experts.67.gate_proj", "model.layers.71.mlp.experts.68.gate_proj", "model.layers.71.mlp.experts.69.gate_proj", "model.layers.71.mlp.experts.70.gate_proj", "model.layers.71.mlp.experts.71.gate_proj", "model.layers.71.mlp.experts.72.gate_proj", "model.layers.71.mlp.experts.73.gate_proj", "model.layers.71.mlp.experts.74.gate_proj", "model.layers.71.mlp.experts.75.gate_proj", "model.layers.71.mlp.experts.76.gate_proj", "model.layers.71.mlp.experts.77.gate_proj", "model.layers.71.mlp.experts.78.gate_proj", "model.layers.71.mlp.experts.79.gate_proj", "model.layers.71.mlp.experts.80.gate_proj", "model.layers.71.mlp.experts.81.gate_proj", "model.layers.71.mlp.experts.82.gate_proj", "model.layers.71.mlp.experts.83.gate_proj", "model.layers.71.mlp.experts.84.gate_proj", "model.layers.71.mlp.experts.85.gate_proj", "model.layers.71.mlp.experts.86.gate_proj", "model.layers.71.mlp.experts.87.gate_proj", "model.layers.71.mlp.experts.88.gate_proj", "model.layers.71.mlp.experts.89.gate_proj", "model.layers.71.mlp.experts.90.gate_proj", "model.layers.71.mlp.experts.91.gate_proj", "model.layers.71.mlp.experts.92.gate_proj", "model.layers.71.mlp.experts.93.gate_proj", "model.layers.71.mlp.experts.94.gate_proj", "model.layers.71.mlp.experts.95.gate_proj", "model.layers.71.mlp.experts.96.gate_proj", "model.layers.71.mlp.experts.97.gate_proj", "model.layers.71.mlp.experts.98.gate_proj", "model.layers.71.mlp.experts.99.gate_proj", "model.layers.71.mlp.experts.100.gate_proj", "model.layers.71.mlp.experts.101.gate_proj", "model.layers.71.mlp.experts.102.gate_proj", "model.layers.71.mlp.experts.103.gate_proj", "model.layers.71.mlp.experts.104.gate_proj", "model.layers.71.mlp.experts.105.gate_proj", "model.layers.71.mlp.experts.106.gate_proj", "model.layers.71.mlp.experts.107.gate_proj", "model.layers.71.mlp.experts.108.gate_proj", "model.layers.71.mlp.experts.109.gate_proj", "model.layers.71.mlp.experts.110.gate_proj", "model.layers.71.mlp.experts.111.gate_proj", "model.layers.71.mlp.experts.112.gate_proj", "model.layers.71.mlp.experts.113.gate_proj", "model.layers.71.mlp.experts.114.gate_proj", "model.layers.71.mlp.experts.115.gate_proj", "model.layers.71.mlp.experts.116.gate_proj", "model.layers.71.mlp.experts.117.gate_proj", "model.layers.71.mlp.experts.118.gate_proj", "model.layers.71.mlp.experts.119.gate_proj", "model.layers.71.mlp.experts.120.gate_proj", "model.layers.71.mlp.experts.121.gate_proj", "model.layers.71.mlp.experts.122.gate_proj", "model.layers.71.mlp.experts.123.gate_proj", "model.layers.71.mlp.experts.124.gate_proj", "model.layers.71.mlp.experts.125.gate_proj", "model.layers.71.mlp.experts.126.gate_proj", "model.layers.71.mlp.experts.127.gate_proj", "model.layers.71.mlp.experts.128.gate_proj", "model.layers.71.mlp.experts.129.gate_proj", "model.layers.71.mlp.experts.130.gate_proj", "model.layers.71.mlp.experts.131.gate_proj", "model.layers.71.mlp.experts.132.gate_proj", "model.layers.71.mlp.experts.133.gate_proj", "model.layers.71.mlp.experts.134.gate_proj", "model.layers.71.mlp.experts.135.gate_proj", "model.layers.71.mlp.experts.136.gate_proj", "model.layers.71.mlp.experts.137.gate_proj", "model.layers.71.mlp.experts.138.gate_proj", "model.layers.71.mlp.experts.139.gate_proj", "model.layers.71.mlp.experts.140.gate_proj", "model.layers.71.mlp.experts.141.gate_proj", "model.layers.71.mlp.experts.142.gate_proj", "model.layers.71.mlp.experts.143.gate_proj", "model.layers.71.mlp.experts.144.gate_proj", "model.layers.71.mlp.experts.145.gate_proj", "model.layers.71.mlp.experts.146.gate_proj", "model.layers.71.mlp.experts.147.gate_proj", "model.layers.71.mlp.experts.148.gate_proj", "model.layers.71.mlp.experts.149.gate_proj", "model.layers.71.mlp.experts.150.gate_proj", "model.layers.71.mlp.experts.151.gate_proj", "model.layers.71.mlp.experts.152.gate_proj", "model.layers.71.mlp.experts.153.gate_proj", "model.layers.71.mlp.experts.154.gate_proj", "model.layers.71.mlp.experts.155.gate_proj", "model.layers.71.mlp.experts.156.gate_proj", "model.layers.71.mlp.experts.157.gate_proj", "model.layers.71.mlp.experts.158.gate_proj", "model.layers.71.mlp.experts.159.gate_proj", "model.layers.71.mlp.experts.0.up_proj", "model.layers.71.mlp.experts.1.up_proj", "model.layers.71.mlp.experts.2.up_proj", "model.layers.71.mlp.experts.3.up_proj", "model.layers.71.mlp.experts.4.up_proj", "model.layers.71.mlp.experts.5.up_proj", "model.layers.71.mlp.experts.6.up_proj", "model.layers.71.mlp.experts.7.up_proj", "model.layers.71.mlp.experts.8.up_proj", "model.layers.71.mlp.experts.9.up_proj", "model.layers.71.mlp.experts.10.up_proj", "model.layers.71.mlp.experts.11.up_proj", "model.layers.71.mlp.experts.12.up_proj", "model.layers.71.mlp.experts.13.up_proj", "model.layers.71.mlp.experts.14.up_proj", "model.layers.71.mlp.experts.15.up_proj", "model.layers.71.mlp.experts.16.up_proj", "model.layers.71.mlp.experts.17.up_proj", "model.layers.71.mlp.experts.18.up_proj", "model.layers.71.mlp.experts.19.up_proj", "model.layers.71.mlp.experts.20.up_proj", "model.layers.71.mlp.experts.21.up_proj", "model.layers.71.mlp.experts.22.up_proj", "model.layers.71.mlp.experts.23.up_proj", "model.layers.71.mlp.experts.24.up_proj", "model.layers.71.mlp.experts.25.up_proj", "model.layers.71.mlp.experts.26.up_proj", "model.layers.71.mlp.experts.27.up_proj", "model.layers.71.mlp.experts.28.up_proj", "model.layers.71.mlp.experts.29.up_proj", "model.layers.71.mlp.experts.30.up_proj", "model.layers.71.mlp.experts.31.up_proj", "model.layers.71.mlp.experts.32.up_proj", "model.layers.71.mlp.experts.33.up_proj", "model.layers.71.mlp.experts.34.up_proj", "model.layers.71.mlp.experts.35.up_proj", "model.layers.71.mlp.experts.36.up_proj", "model.layers.71.mlp.experts.37.up_proj", "model.layers.71.mlp.experts.38.up_proj", "model.layers.71.mlp.experts.39.up_proj", "model.layers.71.mlp.experts.40.up_proj", "model.layers.71.mlp.experts.41.up_proj", "model.layers.71.mlp.experts.42.up_proj", "model.layers.71.mlp.experts.43.up_proj", "model.layers.71.mlp.experts.44.up_proj", "model.layers.71.mlp.experts.45.up_proj", "model.layers.71.mlp.experts.46.up_proj", "model.layers.71.mlp.experts.47.up_proj", "model.layers.71.mlp.experts.48.up_proj", "model.layers.71.mlp.experts.49.up_proj", "model.layers.71.mlp.experts.50.up_proj", "model.layers.71.mlp.experts.51.up_proj", "model.layers.71.mlp.experts.52.up_proj", "model.layers.71.mlp.experts.53.up_proj", "model.layers.71.mlp.experts.54.up_proj", "model.layers.71.mlp.experts.55.up_proj", "model.layers.71.mlp.experts.56.up_proj", "model.layers.71.mlp.experts.57.up_proj", "model.layers.71.mlp.experts.58.up_proj", "model.layers.71.mlp.experts.59.up_proj", "model.layers.71.mlp.experts.60.up_proj", "model.layers.71.mlp.experts.61.up_proj", "model.layers.71.mlp.experts.62.up_proj", "model.layers.71.mlp.experts.63.up_proj", "model.layers.71.mlp.experts.64.up_proj", "model.layers.71.mlp.experts.65.up_proj", "model.layers.71.mlp.experts.66.up_proj", "model.layers.71.mlp.experts.67.up_proj", "model.layers.71.mlp.experts.68.up_proj", "model.layers.71.mlp.experts.69.up_proj", "model.layers.71.mlp.experts.70.up_proj", "model.layers.71.mlp.experts.71.up_proj", "model.layers.71.mlp.experts.72.up_proj", "model.layers.71.mlp.experts.73.up_proj", "model.layers.71.mlp.experts.74.up_proj", "model.layers.71.mlp.experts.75.up_proj", "model.layers.71.mlp.experts.76.up_proj", "model.layers.71.mlp.experts.77.up_proj", "model.layers.71.mlp.experts.78.up_proj", "model.layers.71.mlp.experts.79.up_proj", "model.layers.71.mlp.experts.80.up_proj", "model.layers.71.mlp.experts.81.up_proj", "model.layers.71.mlp.experts.82.up_proj", "model.layers.71.mlp.experts.83.up_proj", "model.layers.71.mlp.experts.84.up_proj", "model.layers.71.mlp.experts.85.up_proj", "model.layers.71.mlp.experts.86.up_proj", "model.layers.71.mlp.experts.87.up_proj", "model.layers.71.mlp.experts.88.up_proj", "model.layers.71.mlp.experts.89.up_proj", "model.layers.71.mlp.experts.90.up_proj", "model.layers.71.mlp.experts.91.up_proj", "model.layers.71.mlp.experts.92.up_proj", "model.layers.71.mlp.experts.93.up_proj", "model.layers.71.mlp.experts.94.up_proj", "model.layers.71.mlp.experts.95.up_proj", "model.layers.71.mlp.experts.96.up_proj", "model.layers.71.mlp.experts.97.up_proj", "model.layers.71.mlp.experts.98.up_proj", "model.layers.71.mlp.experts.99.up_proj", "model.layers.71.mlp.experts.100.up_proj", "model.layers.71.mlp.experts.101.up_proj", "model.layers.71.mlp.experts.102.up_proj", "model.layers.71.mlp.experts.103.up_proj", "model.layers.71.mlp.experts.104.up_proj", "model.layers.71.mlp.experts.105.up_proj", "model.layers.71.mlp.experts.106.up_proj", "model.layers.71.mlp.experts.107.up_proj", "model.layers.71.mlp.experts.108.up_proj", "model.layers.71.mlp.experts.109.up_proj", "model.layers.71.mlp.experts.110.up_proj", "model.layers.71.mlp.experts.111.up_proj", "model.layers.71.mlp.experts.112.up_proj", "model.layers.71.mlp.experts.113.up_proj", "model.layers.71.mlp.experts.114.up_proj", "model.layers.71.mlp.experts.115.up_proj", "model.layers.71.mlp.experts.116.up_proj", "model.layers.71.mlp.experts.117.up_proj", "model.layers.71.mlp.experts.118.up_proj", "model.layers.71.mlp.experts.119.up_proj", "model.layers.71.mlp.experts.120.up_proj", "model.layers.71.mlp.experts.121.up_proj", "model.layers.71.mlp.experts.122.up_proj", "model.layers.71.mlp.experts.123.up_proj", "model.layers.71.mlp.experts.124.up_proj", "model.layers.71.mlp.experts.125.up_proj", "model.layers.71.mlp.experts.126.up_proj", "model.layers.71.mlp.experts.127.up_proj", "model.layers.71.mlp.experts.128.up_proj", "model.layers.71.mlp.experts.129.up_proj", "model.layers.71.mlp.experts.130.up_proj", "model.layers.71.mlp.experts.131.up_proj", "model.layers.71.mlp.experts.132.up_proj", "model.layers.71.mlp.experts.133.up_proj", "model.layers.71.mlp.experts.134.up_proj", "model.layers.71.mlp.experts.135.up_proj", "model.layers.71.mlp.experts.136.up_proj", "model.layers.71.mlp.experts.137.up_proj", "model.layers.71.mlp.experts.138.up_proj", "model.layers.71.mlp.experts.139.up_proj", "model.layers.71.mlp.experts.140.up_proj", "model.layers.71.mlp.experts.141.up_proj", "model.layers.71.mlp.experts.142.up_proj", "model.layers.71.mlp.experts.143.up_proj", "model.layers.71.mlp.experts.144.up_proj", "model.layers.71.mlp.experts.145.up_proj", "model.layers.71.mlp.experts.146.up_proj", "model.layers.71.mlp.experts.147.up_proj", "model.layers.71.mlp.experts.148.up_proj", "model.layers.71.mlp.experts.149.up_proj", "model.layers.71.mlp.experts.150.up_proj", "model.layers.71.mlp.experts.151.up_proj", "model.layers.71.mlp.experts.152.up_proj", "model.layers.71.mlp.experts.153.up_proj", "model.layers.71.mlp.experts.154.up_proj", "model.layers.71.mlp.experts.155.up_proj", "model.layers.71.mlp.experts.156.up_proj", "model.layers.71.mlp.experts.157.up_proj", "model.layers.71.mlp.experts.158.up_proj", "model.layers.71.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -2.8263917192815347e-05, "dbits": 2516582400 }, { "dkld": -1.82484276592728e-05, "dbits": 5033164800 } ] }, { "idx": 428, "layers": [ "model.layers.71.mlp.experts.0.down_proj", "model.layers.71.mlp.experts.1.down_proj", "model.layers.71.mlp.experts.2.down_proj", "model.layers.71.mlp.experts.3.down_proj", "model.layers.71.mlp.experts.4.down_proj", "model.layers.71.mlp.experts.5.down_proj", "model.layers.71.mlp.experts.6.down_proj", "model.layers.71.mlp.experts.7.down_proj", "model.layers.71.mlp.experts.8.down_proj", "model.layers.71.mlp.experts.9.down_proj", "model.layers.71.mlp.experts.10.down_proj", "model.layers.71.mlp.experts.11.down_proj", "model.layers.71.mlp.experts.12.down_proj", "model.layers.71.mlp.experts.13.down_proj", "model.layers.71.mlp.experts.14.down_proj", "model.layers.71.mlp.experts.15.down_proj", "model.layers.71.mlp.experts.16.down_proj", "model.layers.71.mlp.experts.17.down_proj", "model.layers.71.mlp.experts.18.down_proj", "model.layers.71.mlp.experts.19.down_proj", "model.layers.71.mlp.experts.20.down_proj", "model.layers.71.mlp.experts.21.down_proj", "model.layers.71.mlp.experts.22.down_proj", "model.layers.71.mlp.experts.23.down_proj", "model.layers.71.mlp.experts.24.down_proj", "model.layers.71.mlp.experts.25.down_proj", "model.layers.71.mlp.experts.26.down_proj", "model.layers.71.mlp.experts.27.down_proj", "model.layers.71.mlp.experts.28.down_proj", "model.layers.71.mlp.experts.29.down_proj", "model.layers.71.mlp.experts.30.down_proj", "model.layers.71.mlp.experts.31.down_proj", "model.layers.71.mlp.experts.32.down_proj", "model.layers.71.mlp.experts.33.down_proj", "model.layers.71.mlp.experts.34.down_proj", "model.layers.71.mlp.experts.35.down_proj", "model.layers.71.mlp.experts.36.down_proj", "model.layers.71.mlp.experts.37.down_proj", "model.layers.71.mlp.experts.38.down_proj", "model.layers.71.mlp.experts.39.down_proj", "model.layers.71.mlp.experts.40.down_proj", "model.layers.71.mlp.experts.41.down_proj", "model.layers.71.mlp.experts.42.down_proj", "model.layers.71.mlp.experts.43.down_proj", "model.layers.71.mlp.experts.44.down_proj", "model.layers.71.mlp.experts.45.down_proj", "model.layers.71.mlp.experts.46.down_proj", "model.layers.71.mlp.experts.47.down_proj", "model.layers.71.mlp.experts.48.down_proj", "model.layers.71.mlp.experts.49.down_proj", "model.layers.71.mlp.experts.50.down_proj", "model.layers.71.mlp.experts.51.down_proj", "model.layers.71.mlp.experts.52.down_proj", "model.layers.71.mlp.experts.53.down_proj", "model.layers.71.mlp.experts.54.down_proj", "model.layers.71.mlp.experts.55.down_proj", "model.layers.71.mlp.experts.56.down_proj", "model.layers.71.mlp.experts.57.down_proj", "model.layers.71.mlp.experts.58.down_proj", "model.layers.71.mlp.experts.59.down_proj", "model.layers.71.mlp.experts.60.down_proj", "model.layers.71.mlp.experts.61.down_proj", "model.layers.71.mlp.experts.62.down_proj", "model.layers.71.mlp.experts.63.down_proj", "model.layers.71.mlp.experts.64.down_proj", "model.layers.71.mlp.experts.65.down_proj", "model.layers.71.mlp.experts.66.down_proj", "model.layers.71.mlp.experts.67.down_proj", "model.layers.71.mlp.experts.68.down_proj", "model.layers.71.mlp.experts.69.down_proj", "model.layers.71.mlp.experts.70.down_proj", "model.layers.71.mlp.experts.71.down_proj", "model.layers.71.mlp.experts.72.down_proj", "model.layers.71.mlp.experts.73.down_proj", "model.layers.71.mlp.experts.74.down_proj", "model.layers.71.mlp.experts.75.down_proj", "model.layers.71.mlp.experts.76.down_proj", "model.layers.71.mlp.experts.77.down_proj", "model.layers.71.mlp.experts.78.down_proj", "model.layers.71.mlp.experts.79.down_proj", "model.layers.71.mlp.experts.80.down_proj", "model.layers.71.mlp.experts.81.down_proj", "model.layers.71.mlp.experts.82.down_proj", "model.layers.71.mlp.experts.83.down_proj", "model.layers.71.mlp.experts.84.down_proj", "model.layers.71.mlp.experts.85.down_proj", "model.layers.71.mlp.experts.86.down_proj", "model.layers.71.mlp.experts.87.down_proj", "model.layers.71.mlp.experts.88.down_proj", "model.layers.71.mlp.experts.89.down_proj", "model.layers.71.mlp.experts.90.down_proj", "model.layers.71.mlp.experts.91.down_proj", "model.layers.71.mlp.experts.92.down_proj", "model.layers.71.mlp.experts.93.down_proj", "model.layers.71.mlp.experts.94.down_proj", "model.layers.71.mlp.experts.95.down_proj", "model.layers.71.mlp.experts.96.down_proj", "model.layers.71.mlp.experts.97.down_proj", "model.layers.71.mlp.experts.98.down_proj", "model.layers.71.mlp.experts.99.down_proj", "model.layers.71.mlp.experts.100.down_proj", "model.layers.71.mlp.experts.101.down_proj", "model.layers.71.mlp.experts.102.down_proj", "model.layers.71.mlp.experts.103.down_proj", "model.layers.71.mlp.experts.104.down_proj", "model.layers.71.mlp.experts.105.down_proj", "model.layers.71.mlp.experts.106.down_proj", "model.layers.71.mlp.experts.107.down_proj", "model.layers.71.mlp.experts.108.down_proj", "model.layers.71.mlp.experts.109.down_proj", "model.layers.71.mlp.experts.110.down_proj", "model.layers.71.mlp.experts.111.down_proj", "model.layers.71.mlp.experts.112.down_proj", "model.layers.71.mlp.experts.113.down_proj", "model.layers.71.mlp.experts.114.down_proj", "model.layers.71.mlp.experts.115.down_proj", "model.layers.71.mlp.experts.116.down_proj", "model.layers.71.mlp.experts.117.down_proj", "model.layers.71.mlp.experts.118.down_proj", "model.layers.71.mlp.experts.119.down_proj", "model.layers.71.mlp.experts.120.down_proj", "model.layers.71.mlp.experts.121.down_proj", "model.layers.71.mlp.experts.122.down_proj", "model.layers.71.mlp.experts.123.down_proj", "model.layers.71.mlp.experts.124.down_proj", "model.layers.71.mlp.experts.125.down_proj", "model.layers.71.mlp.experts.126.down_proj", "model.layers.71.mlp.experts.127.down_proj", "model.layers.71.mlp.experts.128.down_proj", "model.layers.71.mlp.experts.129.down_proj", "model.layers.71.mlp.experts.130.down_proj", "model.layers.71.mlp.experts.131.down_proj", "model.layers.71.mlp.experts.132.down_proj", "model.layers.71.mlp.experts.133.down_proj", "model.layers.71.mlp.experts.134.down_proj", "model.layers.71.mlp.experts.135.down_proj", "model.layers.71.mlp.experts.136.down_proj", "model.layers.71.mlp.experts.137.down_proj", "model.layers.71.mlp.experts.138.down_proj", "model.layers.71.mlp.experts.139.down_proj", "model.layers.71.mlp.experts.140.down_proj", "model.layers.71.mlp.experts.141.down_proj", "model.layers.71.mlp.experts.142.down_proj", "model.layers.71.mlp.experts.143.down_proj", "model.layers.71.mlp.experts.144.down_proj", "model.layers.71.mlp.experts.145.down_proj", "model.layers.71.mlp.experts.146.down_proj", "model.layers.71.mlp.experts.147.down_proj", "model.layers.71.mlp.experts.148.down_proj", "model.layers.71.mlp.experts.149.down_proj", "model.layers.71.mlp.experts.150.down_proj", "model.layers.71.mlp.experts.151.down_proj", "model.layers.71.mlp.experts.152.down_proj", "model.layers.71.mlp.experts.153.down_proj", "model.layers.71.mlp.experts.154.down_proj", "model.layers.71.mlp.experts.155.down_proj", "model.layers.71.mlp.experts.156.down_proj", "model.layers.71.mlp.experts.157.down_proj", "model.layers.71.mlp.experts.158.down_proj", "model.layers.71.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.3122644051909447e-05, "dbits": 1258291200 }, { "dkld": -2.1907570771872303e-05, "dbits": 2516582400 } ] }, { "idx": 429, "layers": [ "model.layers.72.self_attn.q_proj" ], "candidates": [ { "dkld": 5.119456909598308e-06, "dbits": 62914560 }, { "dkld": 8.85652843862772e-06, "dbits": 125829120 } ] }, { "idx": 430, "layers": [ "model.layers.72.self_attn.k_proj", "model.layers.72.self_attn.v_proj" ], "candidates": [ { "dkld": -4.176981747150421e-07, "dbits": 10485760 }, { "dkld": -2.4217180907726288e-05, "dbits": 20971520 } ] }, { "idx": 431, "layers": [ "model.layers.72.self_attn.o_proj" ], "candidates": [ { "dkld": -1.748728100210359e-05, "dbits": 62914560 }, { "dkld": -2.4639209732411904e-05, "dbits": 125829120 } ] }, { "idx": 432, "layers": [ "model.layers.72.mlp.shared_experts.gate_proj", "model.layers.72.mlp.shared_experts.up_proj", "model.layers.72.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.2846017964183937e-05, "dbits": 23592960 }, { "dkld": -1.6636215150345884e-06, "dbits": 47185920 } ] }, { "idx": 433, "layers": [ "model.layers.72.mlp.experts.0.gate_proj", "model.layers.72.mlp.experts.1.gate_proj", "model.layers.72.mlp.experts.2.gate_proj", "model.layers.72.mlp.experts.3.gate_proj", "model.layers.72.mlp.experts.4.gate_proj", "model.layers.72.mlp.experts.5.gate_proj", "model.layers.72.mlp.experts.6.gate_proj", "model.layers.72.mlp.experts.7.gate_proj", "model.layers.72.mlp.experts.8.gate_proj", "model.layers.72.mlp.experts.9.gate_proj", "model.layers.72.mlp.experts.10.gate_proj", "model.layers.72.mlp.experts.11.gate_proj", "model.layers.72.mlp.experts.12.gate_proj", "model.layers.72.mlp.experts.13.gate_proj", "model.layers.72.mlp.experts.14.gate_proj", "model.layers.72.mlp.experts.15.gate_proj", "model.layers.72.mlp.experts.16.gate_proj", "model.layers.72.mlp.experts.17.gate_proj", "model.layers.72.mlp.experts.18.gate_proj", "model.layers.72.mlp.experts.19.gate_proj", "model.layers.72.mlp.experts.20.gate_proj", "model.layers.72.mlp.experts.21.gate_proj", "model.layers.72.mlp.experts.22.gate_proj", "model.layers.72.mlp.experts.23.gate_proj", "model.layers.72.mlp.experts.24.gate_proj", "model.layers.72.mlp.experts.25.gate_proj", "model.layers.72.mlp.experts.26.gate_proj", "model.layers.72.mlp.experts.27.gate_proj", "model.layers.72.mlp.experts.28.gate_proj", "model.layers.72.mlp.experts.29.gate_proj", "model.layers.72.mlp.experts.30.gate_proj", "model.layers.72.mlp.experts.31.gate_proj", "model.layers.72.mlp.experts.32.gate_proj", "model.layers.72.mlp.experts.33.gate_proj", "model.layers.72.mlp.experts.34.gate_proj", "model.layers.72.mlp.experts.35.gate_proj", "model.layers.72.mlp.experts.36.gate_proj", "model.layers.72.mlp.experts.37.gate_proj", "model.layers.72.mlp.experts.38.gate_proj", "model.layers.72.mlp.experts.39.gate_proj", "model.layers.72.mlp.experts.40.gate_proj", "model.layers.72.mlp.experts.41.gate_proj", "model.layers.72.mlp.experts.42.gate_proj", "model.layers.72.mlp.experts.43.gate_proj", "model.layers.72.mlp.experts.44.gate_proj", "model.layers.72.mlp.experts.45.gate_proj", "model.layers.72.mlp.experts.46.gate_proj", "model.layers.72.mlp.experts.47.gate_proj", "model.layers.72.mlp.experts.48.gate_proj", "model.layers.72.mlp.experts.49.gate_proj", "model.layers.72.mlp.experts.50.gate_proj", "model.layers.72.mlp.experts.51.gate_proj", "model.layers.72.mlp.experts.52.gate_proj", "model.layers.72.mlp.experts.53.gate_proj", "model.layers.72.mlp.experts.54.gate_proj", "model.layers.72.mlp.experts.55.gate_proj", "model.layers.72.mlp.experts.56.gate_proj", "model.layers.72.mlp.experts.57.gate_proj", "model.layers.72.mlp.experts.58.gate_proj", "model.layers.72.mlp.experts.59.gate_proj", "model.layers.72.mlp.experts.60.gate_proj", "model.layers.72.mlp.experts.61.gate_proj", "model.layers.72.mlp.experts.62.gate_proj", "model.layers.72.mlp.experts.63.gate_proj", "model.layers.72.mlp.experts.64.gate_proj", "model.layers.72.mlp.experts.65.gate_proj", "model.layers.72.mlp.experts.66.gate_proj", "model.layers.72.mlp.experts.67.gate_proj", "model.layers.72.mlp.experts.68.gate_proj", "model.layers.72.mlp.experts.69.gate_proj", "model.layers.72.mlp.experts.70.gate_proj", "model.layers.72.mlp.experts.71.gate_proj", "model.layers.72.mlp.experts.72.gate_proj", "model.layers.72.mlp.experts.73.gate_proj", "model.layers.72.mlp.experts.74.gate_proj", "model.layers.72.mlp.experts.75.gate_proj", "model.layers.72.mlp.experts.76.gate_proj", "model.layers.72.mlp.experts.77.gate_proj", "model.layers.72.mlp.experts.78.gate_proj", "model.layers.72.mlp.experts.79.gate_proj", "model.layers.72.mlp.experts.80.gate_proj", "model.layers.72.mlp.experts.81.gate_proj", "model.layers.72.mlp.experts.82.gate_proj", "model.layers.72.mlp.experts.83.gate_proj", "model.layers.72.mlp.experts.84.gate_proj", "model.layers.72.mlp.experts.85.gate_proj", "model.layers.72.mlp.experts.86.gate_proj", "model.layers.72.mlp.experts.87.gate_proj", "model.layers.72.mlp.experts.88.gate_proj", "model.layers.72.mlp.experts.89.gate_proj", "model.layers.72.mlp.experts.90.gate_proj", "model.layers.72.mlp.experts.91.gate_proj", "model.layers.72.mlp.experts.92.gate_proj", "model.layers.72.mlp.experts.93.gate_proj", "model.layers.72.mlp.experts.94.gate_proj", "model.layers.72.mlp.experts.95.gate_proj", "model.layers.72.mlp.experts.96.gate_proj", "model.layers.72.mlp.experts.97.gate_proj", "model.layers.72.mlp.experts.98.gate_proj", "model.layers.72.mlp.experts.99.gate_proj", "model.layers.72.mlp.experts.100.gate_proj", "model.layers.72.mlp.experts.101.gate_proj", "model.layers.72.mlp.experts.102.gate_proj", "model.layers.72.mlp.experts.103.gate_proj", "model.layers.72.mlp.experts.104.gate_proj", "model.layers.72.mlp.experts.105.gate_proj", "model.layers.72.mlp.experts.106.gate_proj", "model.layers.72.mlp.experts.107.gate_proj", "model.layers.72.mlp.experts.108.gate_proj", "model.layers.72.mlp.experts.109.gate_proj", "model.layers.72.mlp.experts.110.gate_proj", "model.layers.72.mlp.experts.111.gate_proj", "model.layers.72.mlp.experts.112.gate_proj", "model.layers.72.mlp.experts.113.gate_proj", "model.layers.72.mlp.experts.114.gate_proj", "model.layers.72.mlp.experts.115.gate_proj", "model.layers.72.mlp.experts.116.gate_proj", "model.layers.72.mlp.experts.117.gate_proj", "model.layers.72.mlp.experts.118.gate_proj", "model.layers.72.mlp.experts.119.gate_proj", "model.layers.72.mlp.experts.120.gate_proj", "model.layers.72.mlp.experts.121.gate_proj", "model.layers.72.mlp.experts.122.gate_proj", "model.layers.72.mlp.experts.123.gate_proj", "model.layers.72.mlp.experts.124.gate_proj", "model.layers.72.mlp.experts.125.gate_proj", "model.layers.72.mlp.experts.126.gate_proj", "model.layers.72.mlp.experts.127.gate_proj", "model.layers.72.mlp.experts.128.gate_proj", "model.layers.72.mlp.experts.129.gate_proj", "model.layers.72.mlp.experts.130.gate_proj", "model.layers.72.mlp.experts.131.gate_proj", "model.layers.72.mlp.experts.132.gate_proj", "model.layers.72.mlp.experts.133.gate_proj", "model.layers.72.mlp.experts.134.gate_proj", "model.layers.72.mlp.experts.135.gate_proj", "model.layers.72.mlp.experts.136.gate_proj", "model.layers.72.mlp.experts.137.gate_proj", "model.layers.72.mlp.experts.138.gate_proj", "model.layers.72.mlp.experts.139.gate_proj", "model.layers.72.mlp.experts.140.gate_proj", "model.layers.72.mlp.experts.141.gate_proj", "model.layers.72.mlp.experts.142.gate_proj", "model.layers.72.mlp.experts.143.gate_proj", "model.layers.72.mlp.experts.144.gate_proj", "model.layers.72.mlp.experts.145.gate_proj", "model.layers.72.mlp.experts.146.gate_proj", "model.layers.72.mlp.experts.147.gate_proj", "model.layers.72.mlp.experts.148.gate_proj", "model.layers.72.mlp.experts.149.gate_proj", "model.layers.72.mlp.experts.150.gate_proj", "model.layers.72.mlp.experts.151.gate_proj", "model.layers.72.mlp.experts.152.gate_proj", "model.layers.72.mlp.experts.153.gate_proj", "model.layers.72.mlp.experts.154.gate_proj", "model.layers.72.mlp.experts.155.gate_proj", "model.layers.72.mlp.experts.156.gate_proj", "model.layers.72.mlp.experts.157.gate_proj", "model.layers.72.mlp.experts.158.gate_proj", "model.layers.72.mlp.experts.159.gate_proj", "model.layers.72.mlp.experts.0.up_proj", "model.layers.72.mlp.experts.1.up_proj", "model.layers.72.mlp.experts.2.up_proj", "model.layers.72.mlp.experts.3.up_proj", "model.layers.72.mlp.experts.4.up_proj", "model.layers.72.mlp.experts.5.up_proj", "model.layers.72.mlp.experts.6.up_proj", "model.layers.72.mlp.experts.7.up_proj", "model.layers.72.mlp.experts.8.up_proj", "model.layers.72.mlp.experts.9.up_proj", "model.layers.72.mlp.experts.10.up_proj", "model.layers.72.mlp.experts.11.up_proj", "model.layers.72.mlp.experts.12.up_proj", "model.layers.72.mlp.experts.13.up_proj", "model.layers.72.mlp.experts.14.up_proj", "model.layers.72.mlp.experts.15.up_proj", "model.layers.72.mlp.experts.16.up_proj", "model.layers.72.mlp.experts.17.up_proj", "model.layers.72.mlp.experts.18.up_proj", "model.layers.72.mlp.experts.19.up_proj", "model.layers.72.mlp.experts.20.up_proj", "model.layers.72.mlp.experts.21.up_proj", "model.layers.72.mlp.experts.22.up_proj", "model.layers.72.mlp.experts.23.up_proj", "model.layers.72.mlp.experts.24.up_proj", "model.layers.72.mlp.experts.25.up_proj", "model.layers.72.mlp.experts.26.up_proj", "model.layers.72.mlp.experts.27.up_proj", "model.layers.72.mlp.experts.28.up_proj", "model.layers.72.mlp.experts.29.up_proj", "model.layers.72.mlp.experts.30.up_proj", "model.layers.72.mlp.experts.31.up_proj", "model.layers.72.mlp.experts.32.up_proj", "model.layers.72.mlp.experts.33.up_proj", "model.layers.72.mlp.experts.34.up_proj", "model.layers.72.mlp.experts.35.up_proj", "model.layers.72.mlp.experts.36.up_proj", "model.layers.72.mlp.experts.37.up_proj", "model.layers.72.mlp.experts.38.up_proj", "model.layers.72.mlp.experts.39.up_proj", "model.layers.72.mlp.experts.40.up_proj", "model.layers.72.mlp.experts.41.up_proj", "model.layers.72.mlp.experts.42.up_proj", "model.layers.72.mlp.experts.43.up_proj", "model.layers.72.mlp.experts.44.up_proj", "model.layers.72.mlp.experts.45.up_proj", "model.layers.72.mlp.experts.46.up_proj", "model.layers.72.mlp.experts.47.up_proj", "model.layers.72.mlp.experts.48.up_proj", "model.layers.72.mlp.experts.49.up_proj", "model.layers.72.mlp.experts.50.up_proj", "model.layers.72.mlp.experts.51.up_proj", "model.layers.72.mlp.experts.52.up_proj", "model.layers.72.mlp.experts.53.up_proj", "model.layers.72.mlp.experts.54.up_proj", "model.layers.72.mlp.experts.55.up_proj", "model.layers.72.mlp.experts.56.up_proj", "model.layers.72.mlp.experts.57.up_proj", "model.layers.72.mlp.experts.58.up_proj", "model.layers.72.mlp.experts.59.up_proj", "model.layers.72.mlp.experts.60.up_proj", "model.layers.72.mlp.experts.61.up_proj", "model.layers.72.mlp.experts.62.up_proj", "model.layers.72.mlp.experts.63.up_proj", "model.layers.72.mlp.experts.64.up_proj", "model.layers.72.mlp.experts.65.up_proj", "model.layers.72.mlp.experts.66.up_proj", "model.layers.72.mlp.experts.67.up_proj", "model.layers.72.mlp.experts.68.up_proj", "model.layers.72.mlp.experts.69.up_proj", "model.layers.72.mlp.experts.70.up_proj", "model.layers.72.mlp.experts.71.up_proj", "model.layers.72.mlp.experts.72.up_proj", "model.layers.72.mlp.experts.73.up_proj", "model.layers.72.mlp.experts.74.up_proj", "model.layers.72.mlp.experts.75.up_proj", "model.layers.72.mlp.experts.76.up_proj", "model.layers.72.mlp.experts.77.up_proj", "model.layers.72.mlp.experts.78.up_proj", "model.layers.72.mlp.experts.79.up_proj", "model.layers.72.mlp.experts.80.up_proj", "model.layers.72.mlp.experts.81.up_proj", "model.layers.72.mlp.experts.82.up_proj", "model.layers.72.mlp.experts.83.up_proj", "model.layers.72.mlp.experts.84.up_proj", "model.layers.72.mlp.experts.85.up_proj", "model.layers.72.mlp.experts.86.up_proj", "model.layers.72.mlp.experts.87.up_proj", "model.layers.72.mlp.experts.88.up_proj", "model.layers.72.mlp.experts.89.up_proj", "model.layers.72.mlp.experts.90.up_proj", "model.layers.72.mlp.experts.91.up_proj", "model.layers.72.mlp.experts.92.up_proj", "model.layers.72.mlp.experts.93.up_proj", "model.layers.72.mlp.experts.94.up_proj", "model.layers.72.mlp.experts.95.up_proj", "model.layers.72.mlp.experts.96.up_proj", "model.layers.72.mlp.experts.97.up_proj", "model.layers.72.mlp.experts.98.up_proj", "model.layers.72.mlp.experts.99.up_proj", "model.layers.72.mlp.experts.100.up_proj", "model.layers.72.mlp.experts.101.up_proj", "model.layers.72.mlp.experts.102.up_proj", "model.layers.72.mlp.experts.103.up_proj", "model.layers.72.mlp.experts.104.up_proj", "model.layers.72.mlp.experts.105.up_proj", "model.layers.72.mlp.experts.106.up_proj", "model.layers.72.mlp.experts.107.up_proj", "model.layers.72.mlp.experts.108.up_proj", "model.layers.72.mlp.experts.109.up_proj", "model.layers.72.mlp.experts.110.up_proj", "model.layers.72.mlp.experts.111.up_proj", "model.layers.72.mlp.experts.112.up_proj", "model.layers.72.mlp.experts.113.up_proj", "model.layers.72.mlp.experts.114.up_proj", "model.layers.72.mlp.experts.115.up_proj", "model.layers.72.mlp.experts.116.up_proj", "model.layers.72.mlp.experts.117.up_proj", "model.layers.72.mlp.experts.118.up_proj", "model.layers.72.mlp.experts.119.up_proj", "model.layers.72.mlp.experts.120.up_proj", "model.layers.72.mlp.experts.121.up_proj", "model.layers.72.mlp.experts.122.up_proj", "model.layers.72.mlp.experts.123.up_proj", "model.layers.72.mlp.experts.124.up_proj", "model.layers.72.mlp.experts.125.up_proj", "model.layers.72.mlp.experts.126.up_proj", "model.layers.72.mlp.experts.127.up_proj", "model.layers.72.mlp.experts.128.up_proj", "model.layers.72.mlp.experts.129.up_proj", "model.layers.72.mlp.experts.130.up_proj", "model.layers.72.mlp.experts.131.up_proj", "model.layers.72.mlp.experts.132.up_proj", "model.layers.72.mlp.experts.133.up_proj", "model.layers.72.mlp.experts.134.up_proj", "model.layers.72.mlp.experts.135.up_proj", "model.layers.72.mlp.experts.136.up_proj", "model.layers.72.mlp.experts.137.up_proj", "model.layers.72.mlp.experts.138.up_proj", "model.layers.72.mlp.experts.139.up_proj", "model.layers.72.mlp.experts.140.up_proj", "model.layers.72.mlp.experts.141.up_proj", "model.layers.72.mlp.experts.142.up_proj", "model.layers.72.mlp.experts.143.up_proj", "model.layers.72.mlp.experts.144.up_proj", "model.layers.72.mlp.experts.145.up_proj", "model.layers.72.mlp.experts.146.up_proj", "model.layers.72.mlp.experts.147.up_proj", "model.layers.72.mlp.experts.148.up_proj", "model.layers.72.mlp.experts.149.up_proj", "model.layers.72.mlp.experts.150.up_proj", "model.layers.72.mlp.experts.151.up_proj", "model.layers.72.mlp.experts.152.up_proj", "model.layers.72.mlp.experts.153.up_proj", "model.layers.72.mlp.experts.154.up_proj", "model.layers.72.mlp.experts.155.up_proj", "model.layers.72.mlp.experts.156.up_proj", "model.layers.72.mlp.experts.157.up_proj", "model.layers.72.mlp.experts.158.up_proj", "model.layers.72.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -4.015411250293116e-05, "dbits": 2516582400 }, { "dkld": -5.162453744560376e-05, "dbits": 5033164800 } ] }, { "idx": 434, "layers": [ "model.layers.72.mlp.experts.0.down_proj", "model.layers.72.mlp.experts.1.down_proj", "model.layers.72.mlp.experts.2.down_proj", "model.layers.72.mlp.experts.3.down_proj", "model.layers.72.mlp.experts.4.down_proj", "model.layers.72.mlp.experts.5.down_proj", "model.layers.72.mlp.experts.6.down_proj", "model.layers.72.mlp.experts.7.down_proj", "model.layers.72.mlp.experts.8.down_proj", "model.layers.72.mlp.experts.9.down_proj", "model.layers.72.mlp.experts.10.down_proj", "model.layers.72.mlp.experts.11.down_proj", "model.layers.72.mlp.experts.12.down_proj", "model.layers.72.mlp.experts.13.down_proj", "model.layers.72.mlp.experts.14.down_proj", "model.layers.72.mlp.experts.15.down_proj", "model.layers.72.mlp.experts.16.down_proj", "model.layers.72.mlp.experts.17.down_proj", "model.layers.72.mlp.experts.18.down_proj", "model.layers.72.mlp.experts.19.down_proj", "model.layers.72.mlp.experts.20.down_proj", "model.layers.72.mlp.experts.21.down_proj", "model.layers.72.mlp.experts.22.down_proj", "model.layers.72.mlp.experts.23.down_proj", "model.layers.72.mlp.experts.24.down_proj", "model.layers.72.mlp.experts.25.down_proj", "model.layers.72.mlp.experts.26.down_proj", "model.layers.72.mlp.experts.27.down_proj", "model.layers.72.mlp.experts.28.down_proj", "model.layers.72.mlp.experts.29.down_proj", "model.layers.72.mlp.experts.30.down_proj", "model.layers.72.mlp.experts.31.down_proj", "model.layers.72.mlp.experts.32.down_proj", "model.layers.72.mlp.experts.33.down_proj", "model.layers.72.mlp.experts.34.down_proj", "model.layers.72.mlp.experts.35.down_proj", "model.layers.72.mlp.experts.36.down_proj", "model.layers.72.mlp.experts.37.down_proj", "model.layers.72.mlp.experts.38.down_proj", "model.layers.72.mlp.experts.39.down_proj", "model.layers.72.mlp.experts.40.down_proj", "model.layers.72.mlp.experts.41.down_proj", "model.layers.72.mlp.experts.42.down_proj", "model.layers.72.mlp.experts.43.down_proj", "model.layers.72.mlp.experts.44.down_proj", "model.layers.72.mlp.experts.45.down_proj", "model.layers.72.mlp.experts.46.down_proj", "model.layers.72.mlp.experts.47.down_proj", "model.layers.72.mlp.experts.48.down_proj", "model.layers.72.mlp.experts.49.down_proj", "model.layers.72.mlp.experts.50.down_proj", "model.layers.72.mlp.experts.51.down_proj", "model.layers.72.mlp.experts.52.down_proj", "model.layers.72.mlp.experts.53.down_proj", "model.layers.72.mlp.experts.54.down_proj", "model.layers.72.mlp.experts.55.down_proj", "model.layers.72.mlp.experts.56.down_proj", "model.layers.72.mlp.experts.57.down_proj", "model.layers.72.mlp.experts.58.down_proj", "model.layers.72.mlp.experts.59.down_proj", "model.layers.72.mlp.experts.60.down_proj", "model.layers.72.mlp.experts.61.down_proj", "model.layers.72.mlp.experts.62.down_proj", "model.layers.72.mlp.experts.63.down_proj", "model.layers.72.mlp.experts.64.down_proj", "model.layers.72.mlp.experts.65.down_proj", "model.layers.72.mlp.experts.66.down_proj", "model.layers.72.mlp.experts.67.down_proj", "model.layers.72.mlp.experts.68.down_proj", "model.layers.72.mlp.experts.69.down_proj", "model.layers.72.mlp.experts.70.down_proj", "model.layers.72.mlp.experts.71.down_proj", "model.layers.72.mlp.experts.72.down_proj", "model.layers.72.mlp.experts.73.down_proj", "model.layers.72.mlp.experts.74.down_proj", "model.layers.72.mlp.experts.75.down_proj", "model.layers.72.mlp.experts.76.down_proj", "model.layers.72.mlp.experts.77.down_proj", "model.layers.72.mlp.experts.78.down_proj", "model.layers.72.mlp.experts.79.down_proj", "model.layers.72.mlp.experts.80.down_proj", "model.layers.72.mlp.experts.81.down_proj", "model.layers.72.mlp.experts.82.down_proj", "model.layers.72.mlp.experts.83.down_proj", "model.layers.72.mlp.experts.84.down_proj", "model.layers.72.mlp.experts.85.down_proj", "model.layers.72.mlp.experts.86.down_proj", "model.layers.72.mlp.experts.87.down_proj", "model.layers.72.mlp.experts.88.down_proj", "model.layers.72.mlp.experts.89.down_proj", "model.layers.72.mlp.experts.90.down_proj", "model.layers.72.mlp.experts.91.down_proj", "model.layers.72.mlp.experts.92.down_proj", "model.layers.72.mlp.experts.93.down_proj", "model.layers.72.mlp.experts.94.down_proj", "model.layers.72.mlp.experts.95.down_proj", "model.layers.72.mlp.experts.96.down_proj", "model.layers.72.mlp.experts.97.down_proj", "model.layers.72.mlp.experts.98.down_proj", "model.layers.72.mlp.experts.99.down_proj", "model.layers.72.mlp.experts.100.down_proj", "model.layers.72.mlp.experts.101.down_proj", "model.layers.72.mlp.experts.102.down_proj", "model.layers.72.mlp.experts.103.down_proj", "model.layers.72.mlp.experts.104.down_proj", "model.layers.72.mlp.experts.105.down_proj", "model.layers.72.mlp.experts.106.down_proj", "model.layers.72.mlp.experts.107.down_proj", "model.layers.72.mlp.experts.108.down_proj", "model.layers.72.mlp.experts.109.down_proj", "model.layers.72.mlp.experts.110.down_proj", "model.layers.72.mlp.experts.111.down_proj", "model.layers.72.mlp.experts.112.down_proj", "model.layers.72.mlp.experts.113.down_proj", "model.layers.72.mlp.experts.114.down_proj", "model.layers.72.mlp.experts.115.down_proj", "model.layers.72.mlp.experts.116.down_proj", "model.layers.72.mlp.experts.117.down_proj", "model.layers.72.mlp.experts.118.down_proj", "model.layers.72.mlp.experts.119.down_proj", "model.layers.72.mlp.experts.120.down_proj", "model.layers.72.mlp.experts.121.down_proj", "model.layers.72.mlp.experts.122.down_proj", "model.layers.72.mlp.experts.123.down_proj", "model.layers.72.mlp.experts.124.down_proj", "model.layers.72.mlp.experts.125.down_proj", "model.layers.72.mlp.experts.126.down_proj", "model.layers.72.mlp.experts.127.down_proj", "model.layers.72.mlp.experts.128.down_proj", "model.layers.72.mlp.experts.129.down_proj", "model.layers.72.mlp.experts.130.down_proj", "model.layers.72.mlp.experts.131.down_proj", "model.layers.72.mlp.experts.132.down_proj", "model.layers.72.mlp.experts.133.down_proj", "model.layers.72.mlp.experts.134.down_proj", "model.layers.72.mlp.experts.135.down_proj", "model.layers.72.mlp.experts.136.down_proj", "model.layers.72.mlp.experts.137.down_proj", "model.layers.72.mlp.experts.138.down_proj", "model.layers.72.mlp.experts.139.down_proj", "model.layers.72.mlp.experts.140.down_proj", "model.layers.72.mlp.experts.141.down_proj", "model.layers.72.mlp.experts.142.down_proj", "model.layers.72.mlp.experts.143.down_proj", "model.layers.72.mlp.experts.144.down_proj", "model.layers.72.mlp.experts.145.down_proj", "model.layers.72.mlp.experts.146.down_proj", "model.layers.72.mlp.experts.147.down_proj", "model.layers.72.mlp.experts.148.down_proj", "model.layers.72.mlp.experts.149.down_proj", "model.layers.72.mlp.experts.150.down_proj", "model.layers.72.mlp.experts.151.down_proj", "model.layers.72.mlp.experts.152.down_proj", "model.layers.72.mlp.experts.153.down_proj", "model.layers.72.mlp.experts.154.down_proj", "model.layers.72.mlp.experts.155.down_proj", "model.layers.72.mlp.experts.156.down_proj", "model.layers.72.mlp.experts.157.down_proj", "model.layers.72.mlp.experts.158.down_proj", "model.layers.72.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.5811924822627457e-05, "dbits": 1258291200 }, { "dkld": -2.180621959268006e-06, "dbits": 2516582400 } ] }, { "idx": 435, "layers": [ "model.layers.73.self_attn.q_proj" ], "candidates": [ { "dkld": 6.45171385258575e-06, "dbits": 62914560 }, { "dkld": 9.265728294849396e-06, "dbits": 125829120 } ] }, { "idx": 436, "layers": [ "model.layers.73.self_attn.k_proj", "model.layers.73.self_attn.v_proj" ], "candidates": [ { "dkld": 3.4897192381323425e-05, "dbits": 10485760 }, { "dkld": 3.3625774085522045e-05, "dbits": 20971520 } ] }, { "idx": 437, "layers": [ "model.layers.73.self_attn.o_proj" ], "candidates": [ { "dkld": 1.1122087016701698e-05, "dbits": 62914560 }, { "dkld": 1.6268203034998374e-05, "dbits": 125829120 } ] }, { "idx": 438, "layers": [ "model.layers.73.mlp.shared_experts.gate_proj", "model.layers.73.mlp.shared_experts.up_proj", "model.layers.73.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.9304873421787522e-05, "dbits": 23592960 }, { "dkld": -2.5898916646838188e-05, "dbits": 47185920 } ] }, { "idx": 439, "layers": [ "model.layers.73.mlp.experts.0.gate_proj", "model.layers.73.mlp.experts.1.gate_proj", "model.layers.73.mlp.experts.2.gate_proj", "model.layers.73.mlp.experts.3.gate_proj", "model.layers.73.mlp.experts.4.gate_proj", "model.layers.73.mlp.experts.5.gate_proj", "model.layers.73.mlp.experts.6.gate_proj", "model.layers.73.mlp.experts.7.gate_proj", "model.layers.73.mlp.experts.8.gate_proj", "model.layers.73.mlp.experts.9.gate_proj", "model.layers.73.mlp.experts.10.gate_proj", "model.layers.73.mlp.experts.11.gate_proj", "model.layers.73.mlp.experts.12.gate_proj", "model.layers.73.mlp.experts.13.gate_proj", "model.layers.73.mlp.experts.14.gate_proj", "model.layers.73.mlp.experts.15.gate_proj", "model.layers.73.mlp.experts.16.gate_proj", "model.layers.73.mlp.experts.17.gate_proj", "model.layers.73.mlp.experts.18.gate_proj", "model.layers.73.mlp.experts.19.gate_proj", "model.layers.73.mlp.experts.20.gate_proj", "model.layers.73.mlp.experts.21.gate_proj", "model.layers.73.mlp.experts.22.gate_proj", "model.layers.73.mlp.experts.23.gate_proj", "model.layers.73.mlp.experts.24.gate_proj", "model.layers.73.mlp.experts.25.gate_proj", "model.layers.73.mlp.experts.26.gate_proj", "model.layers.73.mlp.experts.27.gate_proj", "model.layers.73.mlp.experts.28.gate_proj", "model.layers.73.mlp.experts.29.gate_proj", "model.layers.73.mlp.experts.30.gate_proj", "model.layers.73.mlp.experts.31.gate_proj", "model.layers.73.mlp.experts.32.gate_proj", "model.layers.73.mlp.experts.33.gate_proj", "model.layers.73.mlp.experts.34.gate_proj", "model.layers.73.mlp.experts.35.gate_proj", "model.layers.73.mlp.experts.36.gate_proj", "model.layers.73.mlp.experts.37.gate_proj", "model.layers.73.mlp.experts.38.gate_proj", "model.layers.73.mlp.experts.39.gate_proj", "model.layers.73.mlp.experts.40.gate_proj", "model.layers.73.mlp.experts.41.gate_proj", "model.layers.73.mlp.experts.42.gate_proj", "model.layers.73.mlp.experts.43.gate_proj", "model.layers.73.mlp.experts.44.gate_proj", "model.layers.73.mlp.experts.45.gate_proj", "model.layers.73.mlp.experts.46.gate_proj", "model.layers.73.mlp.experts.47.gate_proj", "model.layers.73.mlp.experts.48.gate_proj", "model.layers.73.mlp.experts.49.gate_proj", "model.layers.73.mlp.experts.50.gate_proj", "model.layers.73.mlp.experts.51.gate_proj", "model.layers.73.mlp.experts.52.gate_proj", "model.layers.73.mlp.experts.53.gate_proj", "model.layers.73.mlp.experts.54.gate_proj", "model.layers.73.mlp.experts.55.gate_proj", "model.layers.73.mlp.experts.56.gate_proj", "model.layers.73.mlp.experts.57.gate_proj", "model.layers.73.mlp.experts.58.gate_proj", "model.layers.73.mlp.experts.59.gate_proj", "model.layers.73.mlp.experts.60.gate_proj", "model.layers.73.mlp.experts.61.gate_proj", "model.layers.73.mlp.experts.62.gate_proj", "model.layers.73.mlp.experts.63.gate_proj", "model.layers.73.mlp.experts.64.gate_proj", "model.layers.73.mlp.experts.65.gate_proj", "model.layers.73.mlp.experts.66.gate_proj", "model.layers.73.mlp.experts.67.gate_proj", "model.layers.73.mlp.experts.68.gate_proj", "model.layers.73.mlp.experts.69.gate_proj", "model.layers.73.mlp.experts.70.gate_proj", "model.layers.73.mlp.experts.71.gate_proj", "model.layers.73.mlp.experts.72.gate_proj", "model.layers.73.mlp.experts.73.gate_proj", "model.layers.73.mlp.experts.74.gate_proj", "model.layers.73.mlp.experts.75.gate_proj", "model.layers.73.mlp.experts.76.gate_proj", "model.layers.73.mlp.experts.77.gate_proj", "model.layers.73.mlp.experts.78.gate_proj", "model.layers.73.mlp.experts.79.gate_proj", "model.layers.73.mlp.experts.80.gate_proj", "model.layers.73.mlp.experts.81.gate_proj", "model.layers.73.mlp.experts.82.gate_proj", "model.layers.73.mlp.experts.83.gate_proj", "model.layers.73.mlp.experts.84.gate_proj", "model.layers.73.mlp.experts.85.gate_proj", "model.layers.73.mlp.experts.86.gate_proj", "model.layers.73.mlp.experts.87.gate_proj", "model.layers.73.mlp.experts.88.gate_proj", "model.layers.73.mlp.experts.89.gate_proj", "model.layers.73.mlp.experts.90.gate_proj", "model.layers.73.mlp.experts.91.gate_proj", "model.layers.73.mlp.experts.92.gate_proj", "model.layers.73.mlp.experts.93.gate_proj", "model.layers.73.mlp.experts.94.gate_proj", "model.layers.73.mlp.experts.95.gate_proj", "model.layers.73.mlp.experts.96.gate_proj", "model.layers.73.mlp.experts.97.gate_proj", "model.layers.73.mlp.experts.98.gate_proj", "model.layers.73.mlp.experts.99.gate_proj", "model.layers.73.mlp.experts.100.gate_proj", "model.layers.73.mlp.experts.101.gate_proj", "model.layers.73.mlp.experts.102.gate_proj", "model.layers.73.mlp.experts.103.gate_proj", "model.layers.73.mlp.experts.104.gate_proj", "model.layers.73.mlp.experts.105.gate_proj", "model.layers.73.mlp.experts.106.gate_proj", "model.layers.73.mlp.experts.107.gate_proj", "model.layers.73.mlp.experts.108.gate_proj", "model.layers.73.mlp.experts.109.gate_proj", "model.layers.73.mlp.experts.110.gate_proj", "model.layers.73.mlp.experts.111.gate_proj", "model.layers.73.mlp.experts.112.gate_proj", "model.layers.73.mlp.experts.113.gate_proj", "model.layers.73.mlp.experts.114.gate_proj", "model.layers.73.mlp.experts.115.gate_proj", "model.layers.73.mlp.experts.116.gate_proj", "model.layers.73.mlp.experts.117.gate_proj", "model.layers.73.mlp.experts.118.gate_proj", "model.layers.73.mlp.experts.119.gate_proj", "model.layers.73.mlp.experts.120.gate_proj", "model.layers.73.mlp.experts.121.gate_proj", "model.layers.73.mlp.experts.122.gate_proj", "model.layers.73.mlp.experts.123.gate_proj", "model.layers.73.mlp.experts.124.gate_proj", "model.layers.73.mlp.experts.125.gate_proj", "model.layers.73.mlp.experts.126.gate_proj", "model.layers.73.mlp.experts.127.gate_proj", "model.layers.73.mlp.experts.128.gate_proj", "model.layers.73.mlp.experts.129.gate_proj", "model.layers.73.mlp.experts.130.gate_proj", "model.layers.73.mlp.experts.131.gate_proj", "model.layers.73.mlp.experts.132.gate_proj", "model.layers.73.mlp.experts.133.gate_proj", "model.layers.73.mlp.experts.134.gate_proj", "model.layers.73.mlp.experts.135.gate_proj", "model.layers.73.mlp.experts.136.gate_proj", "model.layers.73.mlp.experts.137.gate_proj", "model.layers.73.mlp.experts.138.gate_proj", "model.layers.73.mlp.experts.139.gate_proj", "model.layers.73.mlp.experts.140.gate_proj", "model.layers.73.mlp.experts.141.gate_proj", "model.layers.73.mlp.experts.142.gate_proj", "model.layers.73.mlp.experts.143.gate_proj", "model.layers.73.mlp.experts.144.gate_proj", "model.layers.73.mlp.experts.145.gate_proj", "model.layers.73.mlp.experts.146.gate_proj", "model.layers.73.mlp.experts.147.gate_proj", "model.layers.73.mlp.experts.148.gate_proj", "model.layers.73.mlp.experts.149.gate_proj", "model.layers.73.mlp.experts.150.gate_proj", "model.layers.73.mlp.experts.151.gate_proj", "model.layers.73.mlp.experts.152.gate_proj", "model.layers.73.mlp.experts.153.gate_proj", "model.layers.73.mlp.experts.154.gate_proj", "model.layers.73.mlp.experts.155.gate_proj", "model.layers.73.mlp.experts.156.gate_proj", "model.layers.73.mlp.experts.157.gate_proj", "model.layers.73.mlp.experts.158.gate_proj", "model.layers.73.mlp.experts.159.gate_proj", "model.layers.73.mlp.experts.0.up_proj", "model.layers.73.mlp.experts.1.up_proj", "model.layers.73.mlp.experts.2.up_proj", "model.layers.73.mlp.experts.3.up_proj", "model.layers.73.mlp.experts.4.up_proj", "model.layers.73.mlp.experts.5.up_proj", "model.layers.73.mlp.experts.6.up_proj", "model.layers.73.mlp.experts.7.up_proj", "model.layers.73.mlp.experts.8.up_proj", "model.layers.73.mlp.experts.9.up_proj", "model.layers.73.mlp.experts.10.up_proj", "model.layers.73.mlp.experts.11.up_proj", "model.layers.73.mlp.experts.12.up_proj", "model.layers.73.mlp.experts.13.up_proj", "model.layers.73.mlp.experts.14.up_proj", "model.layers.73.mlp.experts.15.up_proj", "model.layers.73.mlp.experts.16.up_proj", "model.layers.73.mlp.experts.17.up_proj", "model.layers.73.mlp.experts.18.up_proj", "model.layers.73.mlp.experts.19.up_proj", "model.layers.73.mlp.experts.20.up_proj", "model.layers.73.mlp.experts.21.up_proj", "model.layers.73.mlp.experts.22.up_proj", "model.layers.73.mlp.experts.23.up_proj", "model.layers.73.mlp.experts.24.up_proj", "model.layers.73.mlp.experts.25.up_proj", "model.layers.73.mlp.experts.26.up_proj", "model.layers.73.mlp.experts.27.up_proj", "model.layers.73.mlp.experts.28.up_proj", "model.layers.73.mlp.experts.29.up_proj", "model.layers.73.mlp.experts.30.up_proj", "model.layers.73.mlp.experts.31.up_proj", "model.layers.73.mlp.experts.32.up_proj", "model.layers.73.mlp.experts.33.up_proj", "model.layers.73.mlp.experts.34.up_proj", "model.layers.73.mlp.experts.35.up_proj", "model.layers.73.mlp.experts.36.up_proj", "model.layers.73.mlp.experts.37.up_proj", "model.layers.73.mlp.experts.38.up_proj", "model.layers.73.mlp.experts.39.up_proj", "model.layers.73.mlp.experts.40.up_proj", "model.layers.73.mlp.experts.41.up_proj", "model.layers.73.mlp.experts.42.up_proj", "model.layers.73.mlp.experts.43.up_proj", "model.layers.73.mlp.experts.44.up_proj", "model.layers.73.mlp.experts.45.up_proj", "model.layers.73.mlp.experts.46.up_proj", "model.layers.73.mlp.experts.47.up_proj", "model.layers.73.mlp.experts.48.up_proj", "model.layers.73.mlp.experts.49.up_proj", "model.layers.73.mlp.experts.50.up_proj", "model.layers.73.mlp.experts.51.up_proj", "model.layers.73.mlp.experts.52.up_proj", "model.layers.73.mlp.experts.53.up_proj", "model.layers.73.mlp.experts.54.up_proj", "model.layers.73.mlp.experts.55.up_proj", "model.layers.73.mlp.experts.56.up_proj", "model.layers.73.mlp.experts.57.up_proj", "model.layers.73.mlp.experts.58.up_proj", "model.layers.73.mlp.experts.59.up_proj", "model.layers.73.mlp.experts.60.up_proj", "model.layers.73.mlp.experts.61.up_proj", "model.layers.73.mlp.experts.62.up_proj", "model.layers.73.mlp.experts.63.up_proj", "model.layers.73.mlp.experts.64.up_proj", "model.layers.73.mlp.experts.65.up_proj", "model.layers.73.mlp.experts.66.up_proj", "model.layers.73.mlp.experts.67.up_proj", "model.layers.73.mlp.experts.68.up_proj", "model.layers.73.mlp.experts.69.up_proj", "model.layers.73.mlp.experts.70.up_proj", "model.layers.73.mlp.experts.71.up_proj", "model.layers.73.mlp.experts.72.up_proj", "model.layers.73.mlp.experts.73.up_proj", "model.layers.73.mlp.experts.74.up_proj", "model.layers.73.mlp.experts.75.up_proj", "model.layers.73.mlp.experts.76.up_proj", "model.layers.73.mlp.experts.77.up_proj", "model.layers.73.mlp.experts.78.up_proj", "model.layers.73.mlp.experts.79.up_proj", "model.layers.73.mlp.experts.80.up_proj", "model.layers.73.mlp.experts.81.up_proj", "model.layers.73.mlp.experts.82.up_proj", "model.layers.73.mlp.experts.83.up_proj", "model.layers.73.mlp.experts.84.up_proj", "model.layers.73.mlp.experts.85.up_proj", "model.layers.73.mlp.experts.86.up_proj", "model.layers.73.mlp.experts.87.up_proj", "model.layers.73.mlp.experts.88.up_proj", "model.layers.73.mlp.experts.89.up_proj", "model.layers.73.mlp.experts.90.up_proj", "model.layers.73.mlp.experts.91.up_proj", "model.layers.73.mlp.experts.92.up_proj", "model.layers.73.mlp.experts.93.up_proj", "model.layers.73.mlp.experts.94.up_proj", "model.layers.73.mlp.experts.95.up_proj", "model.layers.73.mlp.experts.96.up_proj", "model.layers.73.mlp.experts.97.up_proj", "model.layers.73.mlp.experts.98.up_proj", "model.layers.73.mlp.experts.99.up_proj", "model.layers.73.mlp.experts.100.up_proj", "model.layers.73.mlp.experts.101.up_proj", "model.layers.73.mlp.experts.102.up_proj", "model.layers.73.mlp.experts.103.up_proj", "model.layers.73.mlp.experts.104.up_proj", "model.layers.73.mlp.experts.105.up_proj", "model.layers.73.mlp.experts.106.up_proj", "model.layers.73.mlp.experts.107.up_proj", "model.layers.73.mlp.experts.108.up_proj", "model.layers.73.mlp.experts.109.up_proj", "model.layers.73.mlp.experts.110.up_proj", "model.layers.73.mlp.experts.111.up_proj", "model.layers.73.mlp.experts.112.up_proj", "model.layers.73.mlp.experts.113.up_proj", "model.layers.73.mlp.experts.114.up_proj", "model.layers.73.mlp.experts.115.up_proj", "model.layers.73.mlp.experts.116.up_proj", "model.layers.73.mlp.experts.117.up_proj", "model.layers.73.mlp.experts.118.up_proj", "model.layers.73.mlp.experts.119.up_proj", "model.layers.73.mlp.experts.120.up_proj", "model.layers.73.mlp.experts.121.up_proj", "model.layers.73.mlp.experts.122.up_proj", "model.layers.73.mlp.experts.123.up_proj", "model.layers.73.mlp.experts.124.up_proj", "model.layers.73.mlp.experts.125.up_proj", "model.layers.73.mlp.experts.126.up_proj", "model.layers.73.mlp.experts.127.up_proj", "model.layers.73.mlp.experts.128.up_proj", "model.layers.73.mlp.experts.129.up_proj", "model.layers.73.mlp.experts.130.up_proj", "model.layers.73.mlp.experts.131.up_proj", "model.layers.73.mlp.experts.132.up_proj", "model.layers.73.mlp.experts.133.up_proj", "model.layers.73.mlp.experts.134.up_proj", "model.layers.73.mlp.experts.135.up_proj", "model.layers.73.mlp.experts.136.up_proj", "model.layers.73.mlp.experts.137.up_proj", "model.layers.73.mlp.experts.138.up_proj", "model.layers.73.mlp.experts.139.up_proj", "model.layers.73.mlp.experts.140.up_proj", "model.layers.73.mlp.experts.141.up_proj", "model.layers.73.mlp.experts.142.up_proj", "model.layers.73.mlp.experts.143.up_proj", "model.layers.73.mlp.experts.144.up_proj", "model.layers.73.mlp.experts.145.up_proj", "model.layers.73.mlp.experts.146.up_proj", "model.layers.73.mlp.experts.147.up_proj", "model.layers.73.mlp.experts.148.up_proj", "model.layers.73.mlp.experts.149.up_proj", "model.layers.73.mlp.experts.150.up_proj", "model.layers.73.mlp.experts.151.up_proj", "model.layers.73.mlp.experts.152.up_proj", "model.layers.73.mlp.experts.153.up_proj", "model.layers.73.mlp.experts.154.up_proj", "model.layers.73.mlp.experts.155.up_proj", "model.layers.73.mlp.experts.156.up_proj", "model.layers.73.mlp.experts.157.up_proj", "model.layers.73.mlp.experts.158.up_proj", "model.layers.73.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.2222304940225082e-05, "dbits": 2516582400 }, { "dkld": 2.7107540518048895e-06, "dbits": 5033164800 } ] }, { "idx": 440, "layers": [ "model.layers.73.mlp.experts.0.down_proj", "model.layers.73.mlp.experts.1.down_proj", "model.layers.73.mlp.experts.2.down_proj", "model.layers.73.mlp.experts.3.down_proj", "model.layers.73.mlp.experts.4.down_proj", "model.layers.73.mlp.experts.5.down_proj", "model.layers.73.mlp.experts.6.down_proj", "model.layers.73.mlp.experts.7.down_proj", "model.layers.73.mlp.experts.8.down_proj", "model.layers.73.mlp.experts.9.down_proj", "model.layers.73.mlp.experts.10.down_proj", "model.layers.73.mlp.experts.11.down_proj", "model.layers.73.mlp.experts.12.down_proj", "model.layers.73.mlp.experts.13.down_proj", "model.layers.73.mlp.experts.14.down_proj", "model.layers.73.mlp.experts.15.down_proj", "model.layers.73.mlp.experts.16.down_proj", "model.layers.73.mlp.experts.17.down_proj", "model.layers.73.mlp.experts.18.down_proj", "model.layers.73.mlp.experts.19.down_proj", "model.layers.73.mlp.experts.20.down_proj", "model.layers.73.mlp.experts.21.down_proj", "model.layers.73.mlp.experts.22.down_proj", "model.layers.73.mlp.experts.23.down_proj", "model.layers.73.mlp.experts.24.down_proj", "model.layers.73.mlp.experts.25.down_proj", "model.layers.73.mlp.experts.26.down_proj", "model.layers.73.mlp.experts.27.down_proj", "model.layers.73.mlp.experts.28.down_proj", "model.layers.73.mlp.experts.29.down_proj", "model.layers.73.mlp.experts.30.down_proj", "model.layers.73.mlp.experts.31.down_proj", "model.layers.73.mlp.experts.32.down_proj", "model.layers.73.mlp.experts.33.down_proj", "model.layers.73.mlp.experts.34.down_proj", "model.layers.73.mlp.experts.35.down_proj", "model.layers.73.mlp.experts.36.down_proj", "model.layers.73.mlp.experts.37.down_proj", "model.layers.73.mlp.experts.38.down_proj", "model.layers.73.mlp.experts.39.down_proj", "model.layers.73.mlp.experts.40.down_proj", "model.layers.73.mlp.experts.41.down_proj", "model.layers.73.mlp.experts.42.down_proj", "model.layers.73.mlp.experts.43.down_proj", "model.layers.73.mlp.experts.44.down_proj", "model.layers.73.mlp.experts.45.down_proj", "model.layers.73.mlp.experts.46.down_proj", "model.layers.73.mlp.experts.47.down_proj", "model.layers.73.mlp.experts.48.down_proj", "model.layers.73.mlp.experts.49.down_proj", "model.layers.73.mlp.experts.50.down_proj", "model.layers.73.mlp.experts.51.down_proj", "model.layers.73.mlp.experts.52.down_proj", "model.layers.73.mlp.experts.53.down_proj", "model.layers.73.mlp.experts.54.down_proj", "model.layers.73.mlp.experts.55.down_proj", "model.layers.73.mlp.experts.56.down_proj", "model.layers.73.mlp.experts.57.down_proj", "model.layers.73.mlp.experts.58.down_proj", "model.layers.73.mlp.experts.59.down_proj", "model.layers.73.mlp.experts.60.down_proj", "model.layers.73.mlp.experts.61.down_proj", "model.layers.73.mlp.experts.62.down_proj", "model.layers.73.mlp.experts.63.down_proj", "model.layers.73.mlp.experts.64.down_proj", "model.layers.73.mlp.experts.65.down_proj", "model.layers.73.mlp.experts.66.down_proj", "model.layers.73.mlp.experts.67.down_proj", "model.layers.73.mlp.experts.68.down_proj", "model.layers.73.mlp.experts.69.down_proj", "model.layers.73.mlp.experts.70.down_proj", "model.layers.73.mlp.experts.71.down_proj", "model.layers.73.mlp.experts.72.down_proj", "model.layers.73.mlp.experts.73.down_proj", "model.layers.73.mlp.experts.74.down_proj", "model.layers.73.mlp.experts.75.down_proj", "model.layers.73.mlp.experts.76.down_proj", "model.layers.73.mlp.experts.77.down_proj", "model.layers.73.mlp.experts.78.down_proj", "model.layers.73.mlp.experts.79.down_proj", "model.layers.73.mlp.experts.80.down_proj", "model.layers.73.mlp.experts.81.down_proj", "model.layers.73.mlp.experts.82.down_proj", "model.layers.73.mlp.experts.83.down_proj", "model.layers.73.mlp.experts.84.down_proj", "model.layers.73.mlp.experts.85.down_proj", "model.layers.73.mlp.experts.86.down_proj", "model.layers.73.mlp.experts.87.down_proj", "model.layers.73.mlp.experts.88.down_proj", "model.layers.73.mlp.experts.89.down_proj", "model.layers.73.mlp.experts.90.down_proj", "model.layers.73.mlp.experts.91.down_proj", "model.layers.73.mlp.experts.92.down_proj", "model.layers.73.mlp.experts.93.down_proj", "model.layers.73.mlp.experts.94.down_proj", "model.layers.73.mlp.experts.95.down_proj", "model.layers.73.mlp.experts.96.down_proj", "model.layers.73.mlp.experts.97.down_proj", "model.layers.73.mlp.experts.98.down_proj", "model.layers.73.mlp.experts.99.down_proj", "model.layers.73.mlp.experts.100.down_proj", "model.layers.73.mlp.experts.101.down_proj", "model.layers.73.mlp.experts.102.down_proj", "model.layers.73.mlp.experts.103.down_proj", "model.layers.73.mlp.experts.104.down_proj", "model.layers.73.mlp.experts.105.down_proj", "model.layers.73.mlp.experts.106.down_proj", "model.layers.73.mlp.experts.107.down_proj", "model.layers.73.mlp.experts.108.down_proj", "model.layers.73.mlp.experts.109.down_proj", "model.layers.73.mlp.experts.110.down_proj", "model.layers.73.mlp.experts.111.down_proj", "model.layers.73.mlp.experts.112.down_proj", "model.layers.73.mlp.experts.113.down_proj", "model.layers.73.mlp.experts.114.down_proj", "model.layers.73.mlp.experts.115.down_proj", "model.layers.73.mlp.experts.116.down_proj", "model.layers.73.mlp.experts.117.down_proj", "model.layers.73.mlp.experts.118.down_proj", "model.layers.73.mlp.experts.119.down_proj", "model.layers.73.mlp.experts.120.down_proj", "model.layers.73.mlp.experts.121.down_proj", "model.layers.73.mlp.experts.122.down_proj", "model.layers.73.mlp.experts.123.down_proj", "model.layers.73.mlp.experts.124.down_proj", "model.layers.73.mlp.experts.125.down_proj", "model.layers.73.mlp.experts.126.down_proj", "model.layers.73.mlp.experts.127.down_proj", "model.layers.73.mlp.experts.128.down_proj", "model.layers.73.mlp.experts.129.down_proj", "model.layers.73.mlp.experts.130.down_proj", "model.layers.73.mlp.experts.131.down_proj", "model.layers.73.mlp.experts.132.down_proj", "model.layers.73.mlp.experts.133.down_proj", "model.layers.73.mlp.experts.134.down_proj", "model.layers.73.mlp.experts.135.down_proj", "model.layers.73.mlp.experts.136.down_proj", "model.layers.73.mlp.experts.137.down_proj", "model.layers.73.mlp.experts.138.down_proj", "model.layers.73.mlp.experts.139.down_proj", "model.layers.73.mlp.experts.140.down_proj", "model.layers.73.mlp.experts.141.down_proj", "model.layers.73.mlp.experts.142.down_proj", "model.layers.73.mlp.experts.143.down_proj", "model.layers.73.mlp.experts.144.down_proj", "model.layers.73.mlp.experts.145.down_proj", "model.layers.73.mlp.experts.146.down_proj", "model.layers.73.mlp.experts.147.down_proj", "model.layers.73.mlp.experts.148.down_proj", "model.layers.73.mlp.experts.149.down_proj", "model.layers.73.mlp.experts.150.down_proj", "model.layers.73.mlp.experts.151.down_proj", "model.layers.73.mlp.experts.152.down_proj", "model.layers.73.mlp.experts.153.down_proj", "model.layers.73.mlp.experts.154.down_proj", "model.layers.73.mlp.experts.155.down_proj", "model.layers.73.mlp.experts.156.down_proj", "model.layers.73.mlp.experts.157.down_proj", "model.layers.73.mlp.experts.158.down_proj", "model.layers.73.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 6.337999366223812e-06, "dbits": 1258291200 }, { "dkld": -1.2456672266125679e-05, "dbits": 2516582400 } ] }, { "idx": 441, "layers": [ "model.layers.74.self_attn.q_proj" ], "candidates": [ { "dkld": 1.1964701116085052e-05, "dbits": 62914560 }, { "dkld": 1.101219095290401e-06, "dbits": 125829120 } ] }, { "idx": 442, "layers": [ "model.layers.74.self_attn.k_proj", "model.layers.74.self_attn.v_proj" ], "candidates": [ { "dkld": 1.0793330147862434e-05, "dbits": 10485760 }, { "dkld": -9.77835152298108e-06, "dbits": 20971520 } ] }, { "idx": 443, "layers": [ "model.layers.74.self_attn.o_proj" ], "candidates": [ { "dkld": -1.6998220235108635e-05, "dbits": 62914560 }, { "dkld": -2.57834326475824e-06, "dbits": 125829120 } ] }, { "idx": 444, "layers": [ "model.layers.74.mlp.shared_experts.gate_proj", "model.layers.74.mlp.shared_experts.up_proj", "model.layers.74.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 2.7796952053904533e-05, "dbits": 23592960 }, { "dkld": 3.866455517709255e-05, "dbits": 47185920 } ] }, { "idx": 445, "layers": [ "model.layers.74.mlp.experts.0.gate_proj", "model.layers.74.mlp.experts.1.gate_proj", "model.layers.74.mlp.experts.2.gate_proj", "model.layers.74.mlp.experts.3.gate_proj", "model.layers.74.mlp.experts.4.gate_proj", "model.layers.74.mlp.experts.5.gate_proj", "model.layers.74.mlp.experts.6.gate_proj", "model.layers.74.mlp.experts.7.gate_proj", "model.layers.74.mlp.experts.8.gate_proj", "model.layers.74.mlp.experts.9.gate_proj", "model.layers.74.mlp.experts.10.gate_proj", "model.layers.74.mlp.experts.11.gate_proj", "model.layers.74.mlp.experts.12.gate_proj", "model.layers.74.mlp.experts.13.gate_proj", "model.layers.74.mlp.experts.14.gate_proj", "model.layers.74.mlp.experts.15.gate_proj", "model.layers.74.mlp.experts.16.gate_proj", "model.layers.74.mlp.experts.17.gate_proj", "model.layers.74.mlp.experts.18.gate_proj", "model.layers.74.mlp.experts.19.gate_proj", "model.layers.74.mlp.experts.20.gate_proj", "model.layers.74.mlp.experts.21.gate_proj", "model.layers.74.mlp.experts.22.gate_proj", "model.layers.74.mlp.experts.23.gate_proj", "model.layers.74.mlp.experts.24.gate_proj", "model.layers.74.mlp.experts.25.gate_proj", "model.layers.74.mlp.experts.26.gate_proj", "model.layers.74.mlp.experts.27.gate_proj", "model.layers.74.mlp.experts.28.gate_proj", "model.layers.74.mlp.experts.29.gate_proj", "model.layers.74.mlp.experts.30.gate_proj", "model.layers.74.mlp.experts.31.gate_proj", "model.layers.74.mlp.experts.32.gate_proj", "model.layers.74.mlp.experts.33.gate_proj", "model.layers.74.mlp.experts.34.gate_proj", "model.layers.74.mlp.experts.35.gate_proj", "model.layers.74.mlp.experts.36.gate_proj", "model.layers.74.mlp.experts.37.gate_proj", "model.layers.74.mlp.experts.38.gate_proj", "model.layers.74.mlp.experts.39.gate_proj", "model.layers.74.mlp.experts.40.gate_proj", "model.layers.74.mlp.experts.41.gate_proj", "model.layers.74.mlp.experts.42.gate_proj", "model.layers.74.mlp.experts.43.gate_proj", "model.layers.74.mlp.experts.44.gate_proj", "model.layers.74.mlp.experts.45.gate_proj", "model.layers.74.mlp.experts.46.gate_proj", "model.layers.74.mlp.experts.47.gate_proj", "model.layers.74.mlp.experts.48.gate_proj", "model.layers.74.mlp.experts.49.gate_proj", "model.layers.74.mlp.experts.50.gate_proj", "model.layers.74.mlp.experts.51.gate_proj", "model.layers.74.mlp.experts.52.gate_proj", "model.layers.74.mlp.experts.53.gate_proj", "model.layers.74.mlp.experts.54.gate_proj", "model.layers.74.mlp.experts.55.gate_proj", "model.layers.74.mlp.experts.56.gate_proj", "model.layers.74.mlp.experts.57.gate_proj", "model.layers.74.mlp.experts.58.gate_proj", "model.layers.74.mlp.experts.59.gate_proj", "model.layers.74.mlp.experts.60.gate_proj", "model.layers.74.mlp.experts.61.gate_proj", "model.layers.74.mlp.experts.62.gate_proj", "model.layers.74.mlp.experts.63.gate_proj", "model.layers.74.mlp.experts.64.gate_proj", "model.layers.74.mlp.experts.65.gate_proj", "model.layers.74.mlp.experts.66.gate_proj", "model.layers.74.mlp.experts.67.gate_proj", "model.layers.74.mlp.experts.68.gate_proj", "model.layers.74.mlp.experts.69.gate_proj", "model.layers.74.mlp.experts.70.gate_proj", "model.layers.74.mlp.experts.71.gate_proj", "model.layers.74.mlp.experts.72.gate_proj", "model.layers.74.mlp.experts.73.gate_proj", "model.layers.74.mlp.experts.74.gate_proj", "model.layers.74.mlp.experts.75.gate_proj", "model.layers.74.mlp.experts.76.gate_proj", "model.layers.74.mlp.experts.77.gate_proj", "model.layers.74.mlp.experts.78.gate_proj", "model.layers.74.mlp.experts.79.gate_proj", "model.layers.74.mlp.experts.80.gate_proj", "model.layers.74.mlp.experts.81.gate_proj", "model.layers.74.mlp.experts.82.gate_proj", "model.layers.74.mlp.experts.83.gate_proj", "model.layers.74.mlp.experts.84.gate_proj", "model.layers.74.mlp.experts.85.gate_proj", "model.layers.74.mlp.experts.86.gate_proj", "model.layers.74.mlp.experts.87.gate_proj", "model.layers.74.mlp.experts.88.gate_proj", "model.layers.74.mlp.experts.89.gate_proj", "model.layers.74.mlp.experts.90.gate_proj", "model.layers.74.mlp.experts.91.gate_proj", "model.layers.74.mlp.experts.92.gate_proj", "model.layers.74.mlp.experts.93.gate_proj", "model.layers.74.mlp.experts.94.gate_proj", "model.layers.74.mlp.experts.95.gate_proj", "model.layers.74.mlp.experts.96.gate_proj", "model.layers.74.mlp.experts.97.gate_proj", "model.layers.74.mlp.experts.98.gate_proj", "model.layers.74.mlp.experts.99.gate_proj", "model.layers.74.mlp.experts.100.gate_proj", "model.layers.74.mlp.experts.101.gate_proj", "model.layers.74.mlp.experts.102.gate_proj", "model.layers.74.mlp.experts.103.gate_proj", "model.layers.74.mlp.experts.104.gate_proj", "model.layers.74.mlp.experts.105.gate_proj", "model.layers.74.mlp.experts.106.gate_proj", "model.layers.74.mlp.experts.107.gate_proj", "model.layers.74.mlp.experts.108.gate_proj", "model.layers.74.mlp.experts.109.gate_proj", "model.layers.74.mlp.experts.110.gate_proj", "model.layers.74.mlp.experts.111.gate_proj", "model.layers.74.mlp.experts.112.gate_proj", "model.layers.74.mlp.experts.113.gate_proj", "model.layers.74.mlp.experts.114.gate_proj", "model.layers.74.mlp.experts.115.gate_proj", "model.layers.74.mlp.experts.116.gate_proj", "model.layers.74.mlp.experts.117.gate_proj", "model.layers.74.mlp.experts.118.gate_proj", "model.layers.74.mlp.experts.119.gate_proj", "model.layers.74.mlp.experts.120.gate_proj", "model.layers.74.mlp.experts.121.gate_proj", "model.layers.74.mlp.experts.122.gate_proj", "model.layers.74.mlp.experts.123.gate_proj", "model.layers.74.mlp.experts.124.gate_proj", "model.layers.74.mlp.experts.125.gate_proj", "model.layers.74.mlp.experts.126.gate_proj", "model.layers.74.mlp.experts.127.gate_proj", "model.layers.74.mlp.experts.128.gate_proj", "model.layers.74.mlp.experts.129.gate_proj", "model.layers.74.mlp.experts.130.gate_proj", "model.layers.74.mlp.experts.131.gate_proj", "model.layers.74.mlp.experts.132.gate_proj", "model.layers.74.mlp.experts.133.gate_proj", "model.layers.74.mlp.experts.134.gate_proj", "model.layers.74.mlp.experts.135.gate_proj", "model.layers.74.mlp.experts.136.gate_proj", "model.layers.74.mlp.experts.137.gate_proj", "model.layers.74.mlp.experts.138.gate_proj", "model.layers.74.mlp.experts.139.gate_proj", "model.layers.74.mlp.experts.140.gate_proj", "model.layers.74.mlp.experts.141.gate_proj", "model.layers.74.mlp.experts.142.gate_proj", "model.layers.74.mlp.experts.143.gate_proj", "model.layers.74.mlp.experts.144.gate_proj", "model.layers.74.mlp.experts.145.gate_proj", "model.layers.74.mlp.experts.146.gate_proj", "model.layers.74.mlp.experts.147.gate_proj", "model.layers.74.mlp.experts.148.gate_proj", "model.layers.74.mlp.experts.149.gate_proj", "model.layers.74.mlp.experts.150.gate_proj", "model.layers.74.mlp.experts.151.gate_proj", "model.layers.74.mlp.experts.152.gate_proj", "model.layers.74.mlp.experts.153.gate_proj", "model.layers.74.mlp.experts.154.gate_proj", "model.layers.74.mlp.experts.155.gate_proj", "model.layers.74.mlp.experts.156.gate_proj", "model.layers.74.mlp.experts.157.gate_proj", "model.layers.74.mlp.experts.158.gate_proj", "model.layers.74.mlp.experts.159.gate_proj", "model.layers.74.mlp.experts.0.up_proj", "model.layers.74.mlp.experts.1.up_proj", "model.layers.74.mlp.experts.2.up_proj", "model.layers.74.mlp.experts.3.up_proj", "model.layers.74.mlp.experts.4.up_proj", "model.layers.74.mlp.experts.5.up_proj", "model.layers.74.mlp.experts.6.up_proj", "model.layers.74.mlp.experts.7.up_proj", "model.layers.74.mlp.experts.8.up_proj", "model.layers.74.mlp.experts.9.up_proj", "model.layers.74.mlp.experts.10.up_proj", "model.layers.74.mlp.experts.11.up_proj", "model.layers.74.mlp.experts.12.up_proj", "model.layers.74.mlp.experts.13.up_proj", "model.layers.74.mlp.experts.14.up_proj", "model.layers.74.mlp.experts.15.up_proj", "model.layers.74.mlp.experts.16.up_proj", "model.layers.74.mlp.experts.17.up_proj", "model.layers.74.mlp.experts.18.up_proj", "model.layers.74.mlp.experts.19.up_proj", "model.layers.74.mlp.experts.20.up_proj", "model.layers.74.mlp.experts.21.up_proj", "model.layers.74.mlp.experts.22.up_proj", "model.layers.74.mlp.experts.23.up_proj", "model.layers.74.mlp.experts.24.up_proj", "model.layers.74.mlp.experts.25.up_proj", "model.layers.74.mlp.experts.26.up_proj", "model.layers.74.mlp.experts.27.up_proj", "model.layers.74.mlp.experts.28.up_proj", "model.layers.74.mlp.experts.29.up_proj", "model.layers.74.mlp.experts.30.up_proj", "model.layers.74.mlp.experts.31.up_proj", "model.layers.74.mlp.experts.32.up_proj", "model.layers.74.mlp.experts.33.up_proj", "model.layers.74.mlp.experts.34.up_proj", "model.layers.74.mlp.experts.35.up_proj", "model.layers.74.mlp.experts.36.up_proj", "model.layers.74.mlp.experts.37.up_proj", "model.layers.74.mlp.experts.38.up_proj", "model.layers.74.mlp.experts.39.up_proj", "model.layers.74.mlp.experts.40.up_proj", "model.layers.74.mlp.experts.41.up_proj", "model.layers.74.mlp.experts.42.up_proj", "model.layers.74.mlp.experts.43.up_proj", "model.layers.74.mlp.experts.44.up_proj", "model.layers.74.mlp.experts.45.up_proj", "model.layers.74.mlp.experts.46.up_proj", "model.layers.74.mlp.experts.47.up_proj", "model.layers.74.mlp.experts.48.up_proj", "model.layers.74.mlp.experts.49.up_proj", "model.layers.74.mlp.experts.50.up_proj", "model.layers.74.mlp.experts.51.up_proj", "model.layers.74.mlp.experts.52.up_proj", "model.layers.74.mlp.experts.53.up_proj", "model.layers.74.mlp.experts.54.up_proj", "model.layers.74.mlp.experts.55.up_proj", "model.layers.74.mlp.experts.56.up_proj", "model.layers.74.mlp.experts.57.up_proj", "model.layers.74.mlp.experts.58.up_proj", "model.layers.74.mlp.experts.59.up_proj", "model.layers.74.mlp.experts.60.up_proj", "model.layers.74.mlp.experts.61.up_proj", "model.layers.74.mlp.experts.62.up_proj", "model.layers.74.mlp.experts.63.up_proj", "model.layers.74.mlp.experts.64.up_proj", "model.layers.74.mlp.experts.65.up_proj", "model.layers.74.mlp.experts.66.up_proj", "model.layers.74.mlp.experts.67.up_proj", "model.layers.74.mlp.experts.68.up_proj", "model.layers.74.mlp.experts.69.up_proj", "model.layers.74.mlp.experts.70.up_proj", "model.layers.74.mlp.experts.71.up_proj", "model.layers.74.mlp.experts.72.up_proj", "model.layers.74.mlp.experts.73.up_proj", "model.layers.74.mlp.experts.74.up_proj", "model.layers.74.mlp.experts.75.up_proj", "model.layers.74.mlp.experts.76.up_proj", "model.layers.74.mlp.experts.77.up_proj", "model.layers.74.mlp.experts.78.up_proj", "model.layers.74.mlp.experts.79.up_proj", "model.layers.74.mlp.experts.80.up_proj", "model.layers.74.mlp.experts.81.up_proj", "model.layers.74.mlp.experts.82.up_proj", "model.layers.74.mlp.experts.83.up_proj", "model.layers.74.mlp.experts.84.up_proj", "model.layers.74.mlp.experts.85.up_proj", "model.layers.74.mlp.experts.86.up_proj", "model.layers.74.mlp.experts.87.up_proj", "model.layers.74.mlp.experts.88.up_proj", "model.layers.74.mlp.experts.89.up_proj", "model.layers.74.mlp.experts.90.up_proj", "model.layers.74.mlp.experts.91.up_proj", "model.layers.74.mlp.experts.92.up_proj", "model.layers.74.mlp.experts.93.up_proj", "model.layers.74.mlp.experts.94.up_proj", "model.layers.74.mlp.experts.95.up_proj", "model.layers.74.mlp.experts.96.up_proj", "model.layers.74.mlp.experts.97.up_proj", "model.layers.74.mlp.experts.98.up_proj", "model.layers.74.mlp.experts.99.up_proj", "model.layers.74.mlp.experts.100.up_proj", "model.layers.74.mlp.experts.101.up_proj", "model.layers.74.mlp.experts.102.up_proj", "model.layers.74.mlp.experts.103.up_proj", "model.layers.74.mlp.experts.104.up_proj", "model.layers.74.mlp.experts.105.up_proj", "model.layers.74.mlp.experts.106.up_proj", "model.layers.74.mlp.experts.107.up_proj", "model.layers.74.mlp.experts.108.up_proj", "model.layers.74.mlp.experts.109.up_proj", "model.layers.74.mlp.experts.110.up_proj", "model.layers.74.mlp.experts.111.up_proj", "model.layers.74.mlp.experts.112.up_proj", "model.layers.74.mlp.experts.113.up_proj", "model.layers.74.mlp.experts.114.up_proj", "model.layers.74.mlp.experts.115.up_proj", "model.layers.74.mlp.experts.116.up_proj", "model.layers.74.mlp.experts.117.up_proj", "model.layers.74.mlp.experts.118.up_proj", "model.layers.74.mlp.experts.119.up_proj", "model.layers.74.mlp.experts.120.up_proj", "model.layers.74.mlp.experts.121.up_proj", "model.layers.74.mlp.experts.122.up_proj", "model.layers.74.mlp.experts.123.up_proj", "model.layers.74.mlp.experts.124.up_proj", "model.layers.74.mlp.experts.125.up_proj", "model.layers.74.mlp.experts.126.up_proj", "model.layers.74.mlp.experts.127.up_proj", "model.layers.74.mlp.experts.128.up_proj", "model.layers.74.mlp.experts.129.up_proj", "model.layers.74.mlp.experts.130.up_proj", "model.layers.74.mlp.experts.131.up_proj", "model.layers.74.mlp.experts.132.up_proj", "model.layers.74.mlp.experts.133.up_proj", "model.layers.74.mlp.experts.134.up_proj", "model.layers.74.mlp.experts.135.up_proj", "model.layers.74.mlp.experts.136.up_proj", "model.layers.74.mlp.experts.137.up_proj", "model.layers.74.mlp.experts.138.up_proj", "model.layers.74.mlp.experts.139.up_proj", "model.layers.74.mlp.experts.140.up_proj", "model.layers.74.mlp.experts.141.up_proj", "model.layers.74.mlp.experts.142.up_proj", "model.layers.74.mlp.experts.143.up_proj", "model.layers.74.mlp.experts.144.up_proj", "model.layers.74.mlp.experts.145.up_proj", "model.layers.74.mlp.experts.146.up_proj", "model.layers.74.mlp.experts.147.up_proj", "model.layers.74.mlp.experts.148.up_proj", "model.layers.74.mlp.experts.149.up_proj", "model.layers.74.mlp.experts.150.up_proj", "model.layers.74.mlp.experts.151.up_proj", "model.layers.74.mlp.experts.152.up_proj", "model.layers.74.mlp.experts.153.up_proj", "model.layers.74.mlp.experts.154.up_proj", "model.layers.74.mlp.experts.155.up_proj", "model.layers.74.mlp.experts.156.up_proj", "model.layers.74.mlp.experts.157.up_proj", "model.layers.74.mlp.experts.158.up_proj", "model.layers.74.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.5921890735640098e-06, "dbits": 2516582400 }, { "dkld": -8.868728764354836e-06, "dbits": 5033164800 } ] }, { "idx": 446, "layers": [ "model.layers.74.mlp.experts.0.down_proj", "model.layers.74.mlp.experts.1.down_proj", "model.layers.74.mlp.experts.2.down_proj", "model.layers.74.mlp.experts.3.down_proj", "model.layers.74.mlp.experts.4.down_proj", "model.layers.74.mlp.experts.5.down_proj", "model.layers.74.mlp.experts.6.down_proj", "model.layers.74.mlp.experts.7.down_proj", "model.layers.74.mlp.experts.8.down_proj", "model.layers.74.mlp.experts.9.down_proj", "model.layers.74.mlp.experts.10.down_proj", "model.layers.74.mlp.experts.11.down_proj", "model.layers.74.mlp.experts.12.down_proj", "model.layers.74.mlp.experts.13.down_proj", "model.layers.74.mlp.experts.14.down_proj", "model.layers.74.mlp.experts.15.down_proj", "model.layers.74.mlp.experts.16.down_proj", "model.layers.74.mlp.experts.17.down_proj", "model.layers.74.mlp.experts.18.down_proj", "model.layers.74.mlp.experts.19.down_proj", "model.layers.74.mlp.experts.20.down_proj", "model.layers.74.mlp.experts.21.down_proj", "model.layers.74.mlp.experts.22.down_proj", "model.layers.74.mlp.experts.23.down_proj", "model.layers.74.mlp.experts.24.down_proj", "model.layers.74.mlp.experts.25.down_proj", "model.layers.74.mlp.experts.26.down_proj", "model.layers.74.mlp.experts.27.down_proj", "model.layers.74.mlp.experts.28.down_proj", "model.layers.74.mlp.experts.29.down_proj", "model.layers.74.mlp.experts.30.down_proj", "model.layers.74.mlp.experts.31.down_proj", "model.layers.74.mlp.experts.32.down_proj", "model.layers.74.mlp.experts.33.down_proj", "model.layers.74.mlp.experts.34.down_proj", "model.layers.74.mlp.experts.35.down_proj", "model.layers.74.mlp.experts.36.down_proj", "model.layers.74.mlp.experts.37.down_proj", "model.layers.74.mlp.experts.38.down_proj", "model.layers.74.mlp.experts.39.down_proj", "model.layers.74.mlp.experts.40.down_proj", "model.layers.74.mlp.experts.41.down_proj", "model.layers.74.mlp.experts.42.down_proj", "model.layers.74.mlp.experts.43.down_proj", "model.layers.74.mlp.experts.44.down_proj", "model.layers.74.mlp.experts.45.down_proj", "model.layers.74.mlp.experts.46.down_proj", "model.layers.74.mlp.experts.47.down_proj", "model.layers.74.mlp.experts.48.down_proj", "model.layers.74.mlp.experts.49.down_proj", "model.layers.74.mlp.experts.50.down_proj", "model.layers.74.mlp.experts.51.down_proj", "model.layers.74.mlp.experts.52.down_proj", "model.layers.74.mlp.experts.53.down_proj", "model.layers.74.mlp.experts.54.down_proj", "model.layers.74.mlp.experts.55.down_proj", "model.layers.74.mlp.experts.56.down_proj", "model.layers.74.mlp.experts.57.down_proj", "model.layers.74.mlp.experts.58.down_proj", "model.layers.74.mlp.experts.59.down_proj", "model.layers.74.mlp.experts.60.down_proj", "model.layers.74.mlp.experts.61.down_proj", "model.layers.74.mlp.experts.62.down_proj", "model.layers.74.mlp.experts.63.down_proj", "model.layers.74.mlp.experts.64.down_proj", "model.layers.74.mlp.experts.65.down_proj", "model.layers.74.mlp.experts.66.down_proj", "model.layers.74.mlp.experts.67.down_proj", "model.layers.74.mlp.experts.68.down_proj", "model.layers.74.mlp.experts.69.down_proj", "model.layers.74.mlp.experts.70.down_proj", "model.layers.74.mlp.experts.71.down_proj", "model.layers.74.mlp.experts.72.down_proj", "model.layers.74.mlp.experts.73.down_proj", "model.layers.74.mlp.experts.74.down_proj", "model.layers.74.mlp.experts.75.down_proj", "model.layers.74.mlp.experts.76.down_proj", "model.layers.74.mlp.experts.77.down_proj", "model.layers.74.mlp.experts.78.down_proj", "model.layers.74.mlp.experts.79.down_proj", "model.layers.74.mlp.experts.80.down_proj", "model.layers.74.mlp.experts.81.down_proj", "model.layers.74.mlp.experts.82.down_proj", "model.layers.74.mlp.experts.83.down_proj", "model.layers.74.mlp.experts.84.down_proj", "model.layers.74.mlp.experts.85.down_proj", "model.layers.74.mlp.experts.86.down_proj", "model.layers.74.mlp.experts.87.down_proj", "model.layers.74.mlp.experts.88.down_proj", "model.layers.74.mlp.experts.89.down_proj", "model.layers.74.mlp.experts.90.down_proj", "model.layers.74.mlp.experts.91.down_proj", "model.layers.74.mlp.experts.92.down_proj", "model.layers.74.mlp.experts.93.down_proj", "model.layers.74.mlp.experts.94.down_proj", "model.layers.74.mlp.experts.95.down_proj", "model.layers.74.mlp.experts.96.down_proj", "model.layers.74.mlp.experts.97.down_proj", "model.layers.74.mlp.experts.98.down_proj", "model.layers.74.mlp.experts.99.down_proj", "model.layers.74.mlp.experts.100.down_proj", "model.layers.74.mlp.experts.101.down_proj", "model.layers.74.mlp.experts.102.down_proj", "model.layers.74.mlp.experts.103.down_proj", "model.layers.74.mlp.experts.104.down_proj", "model.layers.74.mlp.experts.105.down_proj", "model.layers.74.mlp.experts.106.down_proj", "model.layers.74.mlp.experts.107.down_proj", "model.layers.74.mlp.experts.108.down_proj", "model.layers.74.mlp.experts.109.down_proj", "model.layers.74.mlp.experts.110.down_proj", "model.layers.74.mlp.experts.111.down_proj", "model.layers.74.mlp.experts.112.down_proj", "model.layers.74.mlp.experts.113.down_proj", "model.layers.74.mlp.experts.114.down_proj", "model.layers.74.mlp.experts.115.down_proj", "model.layers.74.mlp.experts.116.down_proj", "model.layers.74.mlp.experts.117.down_proj", "model.layers.74.mlp.experts.118.down_proj", "model.layers.74.mlp.experts.119.down_proj", "model.layers.74.mlp.experts.120.down_proj", "model.layers.74.mlp.experts.121.down_proj", "model.layers.74.mlp.experts.122.down_proj", "model.layers.74.mlp.experts.123.down_proj", "model.layers.74.mlp.experts.124.down_proj", "model.layers.74.mlp.experts.125.down_proj", "model.layers.74.mlp.experts.126.down_proj", "model.layers.74.mlp.experts.127.down_proj", "model.layers.74.mlp.experts.128.down_proj", "model.layers.74.mlp.experts.129.down_proj", "model.layers.74.mlp.experts.130.down_proj", "model.layers.74.mlp.experts.131.down_proj", "model.layers.74.mlp.experts.132.down_proj", "model.layers.74.mlp.experts.133.down_proj", "model.layers.74.mlp.experts.134.down_proj", "model.layers.74.mlp.experts.135.down_proj", "model.layers.74.mlp.experts.136.down_proj", "model.layers.74.mlp.experts.137.down_proj", "model.layers.74.mlp.experts.138.down_proj", "model.layers.74.mlp.experts.139.down_proj", "model.layers.74.mlp.experts.140.down_proj", "model.layers.74.mlp.experts.141.down_proj", "model.layers.74.mlp.experts.142.down_proj", "model.layers.74.mlp.experts.143.down_proj", "model.layers.74.mlp.experts.144.down_proj", "model.layers.74.mlp.experts.145.down_proj", "model.layers.74.mlp.experts.146.down_proj", "model.layers.74.mlp.experts.147.down_proj", "model.layers.74.mlp.experts.148.down_proj", "model.layers.74.mlp.experts.149.down_proj", "model.layers.74.mlp.experts.150.down_proj", "model.layers.74.mlp.experts.151.down_proj", "model.layers.74.mlp.experts.152.down_proj", "model.layers.74.mlp.experts.153.down_proj", "model.layers.74.mlp.experts.154.down_proj", "model.layers.74.mlp.experts.155.down_proj", "model.layers.74.mlp.experts.156.down_proj", "model.layers.74.mlp.experts.157.down_proj", "model.layers.74.mlp.experts.158.down_proj", "model.layers.74.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.7143163606524467e-05, "dbits": 1258291200 }, { "dkld": -2.601812593638897e-05, "dbits": 2516582400 } ] }, { "idx": 447, "layers": [ "model.layers.75.self_attn.q_proj" ], "candidates": [ { "dkld": -2.642259933054343e-05, "dbits": 62914560 }, { "dkld": -5.351193249224576e-06, "dbits": 125829120 } ] }, { "idx": 448, "layers": [ "model.layers.75.self_attn.k_proj", "model.layers.75.self_attn.v_proj" ], "candidates": [ { "dkld": -3.7828925997015345e-06, "dbits": 10485760 }, { "dkld": 3.3151591196656227e-06, "dbits": 20971520 } ] }, { "idx": 449, "layers": [ "model.layers.75.self_attn.o_proj" ], "candidates": [ { "dkld": 3.3169519156224514e-06, "dbits": 62914560 }, { "dkld": -7.6101627200838434e-06, "dbits": 125829120 } ] }, { "idx": 450, "layers": [ "model.layers.75.mlp.shared_experts.gate_proj", "model.layers.75.mlp.shared_experts.up_proj", "model.layers.75.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -4.832767881452968e-05, "dbits": 23592960 }, { "dkld": -4.006093367934192e-05, "dbits": 47185920 } ] }, { "idx": 451, "layers": [ "model.layers.75.mlp.experts.0.gate_proj", "model.layers.75.mlp.experts.1.gate_proj", "model.layers.75.mlp.experts.2.gate_proj", "model.layers.75.mlp.experts.3.gate_proj", "model.layers.75.mlp.experts.4.gate_proj", "model.layers.75.mlp.experts.5.gate_proj", "model.layers.75.mlp.experts.6.gate_proj", "model.layers.75.mlp.experts.7.gate_proj", "model.layers.75.mlp.experts.8.gate_proj", "model.layers.75.mlp.experts.9.gate_proj", "model.layers.75.mlp.experts.10.gate_proj", "model.layers.75.mlp.experts.11.gate_proj", "model.layers.75.mlp.experts.12.gate_proj", "model.layers.75.mlp.experts.13.gate_proj", "model.layers.75.mlp.experts.14.gate_proj", "model.layers.75.mlp.experts.15.gate_proj", "model.layers.75.mlp.experts.16.gate_proj", "model.layers.75.mlp.experts.17.gate_proj", "model.layers.75.mlp.experts.18.gate_proj", "model.layers.75.mlp.experts.19.gate_proj", "model.layers.75.mlp.experts.20.gate_proj", "model.layers.75.mlp.experts.21.gate_proj", "model.layers.75.mlp.experts.22.gate_proj", "model.layers.75.mlp.experts.23.gate_proj", "model.layers.75.mlp.experts.24.gate_proj", "model.layers.75.mlp.experts.25.gate_proj", "model.layers.75.mlp.experts.26.gate_proj", "model.layers.75.mlp.experts.27.gate_proj", "model.layers.75.mlp.experts.28.gate_proj", "model.layers.75.mlp.experts.29.gate_proj", "model.layers.75.mlp.experts.30.gate_proj", "model.layers.75.mlp.experts.31.gate_proj", "model.layers.75.mlp.experts.32.gate_proj", "model.layers.75.mlp.experts.33.gate_proj", "model.layers.75.mlp.experts.34.gate_proj", "model.layers.75.mlp.experts.35.gate_proj", "model.layers.75.mlp.experts.36.gate_proj", "model.layers.75.mlp.experts.37.gate_proj", "model.layers.75.mlp.experts.38.gate_proj", "model.layers.75.mlp.experts.39.gate_proj", "model.layers.75.mlp.experts.40.gate_proj", "model.layers.75.mlp.experts.41.gate_proj", "model.layers.75.mlp.experts.42.gate_proj", "model.layers.75.mlp.experts.43.gate_proj", "model.layers.75.mlp.experts.44.gate_proj", "model.layers.75.mlp.experts.45.gate_proj", "model.layers.75.mlp.experts.46.gate_proj", "model.layers.75.mlp.experts.47.gate_proj", "model.layers.75.mlp.experts.48.gate_proj", "model.layers.75.mlp.experts.49.gate_proj", "model.layers.75.mlp.experts.50.gate_proj", "model.layers.75.mlp.experts.51.gate_proj", "model.layers.75.mlp.experts.52.gate_proj", "model.layers.75.mlp.experts.53.gate_proj", "model.layers.75.mlp.experts.54.gate_proj", "model.layers.75.mlp.experts.55.gate_proj", "model.layers.75.mlp.experts.56.gate_proj", "model.layers.75.mlp.experts.57.gate_proj", "model.layers.75.mlp.experts.58.gate_proj", "model.layers.75.mlp.experts.59.gate_proj", "model.layers.75.mlp.experts.60.gate_proj", "model.layers.75.mlp.experts.61.gate_proj", "model.layers.75.mlp.experts.62.gate_proj", "model.layers.75.mlp.experts.63.gate_proj", "model.layers.75.mlp.experts.64.gate_proj", "model.layers.75.mlp.experts.65.gate_proj", "model.layers.75.mlp.experts.66.gate_proj", "model.layers.75.mlp.experts.67.gate_proj", "model.layers.75.mlp.experts.68.gate_proj", "model.layers.75.mlp.experts.69.gate_proj", "model.layers.75.mlp.experts.70.gate_proj", "model.layers.75.mlp.experts.71.gate_proj", "model.layers.75.mlp.experts.72.gate_proj", "model.layers.75.mlp.experts.73.gate_proj", "model.layers.75.mlp.experts.74.gate_proj", "model.layers.75.mlp.experts.75.gate_proj", "model.layers.75.mlp.experts.76.gate_proj", "model.layers.75.mlp.experts.77.gate_proj", "model.layers.75.mlp.experts.78.gate_proj", "model.layers.75.mlp.experts.79.gate_proj", "model.layers.75.mlp.experts.80.gate_proj", "model.layers.75.mlp.experts.81.gate_proj", "model.layers.75.mlp.experts.82.gate_proj", "model.layers.75.mlp.experts.83.gate_proj", "model.layers.75.mlp.experts.84.gate_proj", "model.layers.75.mlp.experts.85.gate_proj", "model.layers.75.mlp.experts.86.gate_proj", "model.layers.75.mlp.experts.87.gate_proj", "model.layers.75.mlp.experts.88.gate_proj", "model.layers.75.mlp.experts.89.gate_proj", "model.layers.75.mlp.experts.90.gate_proj", "model.layers.75.mlp.experts.91.gate_proj", "model.layers.75.mlp.experts.92.gate_proj", "model.layers.75.mlp.experts.93.gate_proj", "model.layers.75.mlp.experts.94.gate_proj", "model.layers.75.mlp.experts.95.gate_proj", "model.layers.75.mlp.experts.96.gate_proj", "model.layers.75.mlp.experts.97.gate_proj", "model.layers.75.mlp.experts.98.gate_proj", "model.layers.75.mlp.experts.99.gate_proj", "model.layers.75.mlp.experts.100.gate_proj", "model.layers.75.mlp.experts.101.gate_proj", "model.layers.75.mlp.experts.102.gate_proj", "model.layers.75.mlp.experts.103.gate_proj", "model.layers.75.mlp.experts.104.gate_proj", "model.layers.75.mlp.experts.105.gate_proj", "model.layers.75.mlp.experts.106.gate_proj", "model.layers.75.mlp.experts.107.gate_proj", "model.layers.75.mlp.experts.108.gate_proj", "model.layers.75.mlp.experts.109.gate_proj", "model.layers.75.mlp.experts.110.gate_proj", "model.layers.75.mlp.experts.111.gate_proj", "model.layers.75.mlp.experts.112.gate_proj", "model.layers.75.mlp.experts.113.gate_proj", "model.layers.75.mlp.experts.114.gate_proj", "model.layers.75.mlp.experts.115.gate_proj", "model.layers.75.mlp.experts.116.gate_proj", "model.layers.75.mlp.experts.117.gate_proj", "model.layers.75.mlp.experts.118.gate_proj", "model.layers.75.mlp.experts.119.gate_proj", "model.layers.75.mlp.experts.120.gate_proj", "model.layers.75.mlp.experts.121.gate_proj", "model.layers.75.mlp.experts.122.gate_proj", "model.layers.75.mlp.experts.123.gate_proj", "model.layers.75.mlp.experts.124.gate_proj", "model.layers.75.mlp.experts.125.gate_proj", "model.layers.75.mlp.experts.126.gate_proj", "model.layers.75.mlp.experts.127.gate_proj", "model.layers.75.mlp.experts.128.gate_proj", "model.layers.75.mlp.experts.129.gate_proj", "model.layers.75.mlp.experts.130.gate_proj", "model.layers.75.mlp.experts.131.gate_proj", "model.layers.75.mlp.experts.132.gate_proj", "model.layers.75.mlp.experts.133.gate_proj", "model.layers.75.mlp.experts.134.gate_proj", "model.layers.75.mlp.experts.135.gate_proj", "model.layers.75.mlp.experts.136.gate_proj", "model.layers.75.mlp.experts.137.gate_proj", "model.layers.75.mlp.experts.138.gate_proj", "model.layers.75.mlp.experts.139.gate_proj", "model.layers.75.mlp.experts.140.gate_proj", "model.layers.75.mlp.experts.141.gate_proj", "model.layers.75.mlp.experts.142.gate_proj", "model.layers.75.mlp.experts.143.gate_proj", "model.layers.75.mlp.experts.144.gate_proj", "model.layers.75.mlp.experts.145.gate_proj", "model.layers.75.mlp.experts.146.gate_proj", "model.layers.75.mlp.experts.147.gate_proj", "model.layers.75.mlp.experts.148.gate_proj", "model.layers.75.mlp.experts.149.gate_proj", "model.layers.75.mlp.experts.150.gate_proj", "model.layers.75.mlp.experts.151.gate_proj", "model.layers.75.mlp.experts.152.gate_proj", "model.layers.75.mlp.experts.153.gate_proj", "model.layers.75.mlp.experts.154.gate_proj", "model.layers.75.mlp.experts.155.gate_proj", "model.layers.75.mlp.experts.156.gate_proj", "model.layers.75.mlp.experts.157.gate_proj", "model.layers.75.mlp.experts.158.gate_proj", "model.layers.75.mlp.experts.159.gate_proj", "model.layers.75.mlp.experts.0.up_proj", "model.layers.75.mlp.experts.1.up_proj", "model.layers.75.mlp.experts.2.up_proj", "model.layers.75.mlp.experts.3.up_proj", "model.layers.75.mlp.experts.4.up_proj", "model.layers.75.mlp.experts.5.up_proj", "model.layers.75.mlp.experts.6.up_proj", "model.layers.75.mlp.experts.7.up_proj", "model.layers.75.mlp.experts.8.up_proj", "model.layers.75.mlp.experts.9.up_proj", "model.layers.75.mlp.experts.10.up_proj", "model.layers.75.mlp.experts.11.up_proj", "model.layers.75.mlp.experts.12.up_proj", "model.layers.75.mlp.experts.13.up_proj", "model.layers.75.mlp.experts.14.up_proj", "model.layers.75.mlp.experts.15.up_proj", "model.layers.75.mlp.experts.16.up_proj", "model.layers.75.mlp.experts.17.up_proj", "model.layers.75.mlp.experts.18.up_proj", "model.layers.75.mlp.experts.19.up_proj", "model.layers.75.mlp.experts.20.up_proj", "model.layers.75.mlp.experts.21.up_proj", "model.layers.75.mlp.experts.22.up_proj", "model.layers.75.mlp.experts.23.up_proj", "model.layers.75.mlp.experts.24.up_proj", "model.layers.75.mlp.experts.25.up_proj", "model.layers.75.mlp.experts.26.up_proj", "model.layers.75.mlp.experts.27.up_proj", "model.layers.75.mlp.experts.28.up_proj", "model.layers.75.mlp.experts.29.up_proj", "model.layers.75.mlp.experts.30.up_proj", "model.layers.75.mlp.experts.31.up_proj", "model.layers.75.mlp.experts.32.up_proj", "model.layers.75.mlp.experts.33.up_proj", "model.layers.75.mlp.experts.34.up_proj", "model.layers.75.mlp.experts.35.up_proj", "model.layers.75.mlp.experts.36.up_proj", "model.layers.75.mlp.experts.37.up_proj", "model.layers.75.mlp.experts.38.up_proj", "model.layers.75.mlp.experts.39.up_proj", "model.layers.75.mlp.experts.40.up_proj", "model.layers.75.mlp.experts.41.up_proj", "model.layers.75.mlp.experts.42.up_proj", "model.layers.75.mlp.experts.43.up_proj", "model.layers.75.mlp.experts.44.up_proj", "model.layers.75.mlp.experts.45.up_proj", "model.layers.75.mlp.experts.46.up_proj", "model.layers.75.mlp.experts.47.up_proj", "model.layers.75.mlp.experts.48.up_proj", "model.layers.75.mlp.experts.49.up_proj", "model.layers.75.mlp.experts.50.up_proj", "model.layers.75.mlp.experts.51.up_proj", "model.layers.75.mlp.experts.52.up_proj", "model.layers.75.mlp.experts.53.up_proj", "model.layers.75.mlp.experts.54.up_proj", "model.layers.75.mlp.experts.55.up_proj", "model.layers.75.mlp.experts.56.up_proj", "model.layers.75.mlp.experts.57.up_proj", "model.layers.75.mlp.experts.58.up_proj", "model.layers.75.mlp.experts.59.up_proj", "model.layers.75.mlp.experts.60.up_proj", "model.layers.75.mlp.experts.61.up_proj", "model.layers.75.mlp.experts.62.up_proj", "model.layers.75.mlp.experts.63.up_proj", "model.layers.75.mlp.experts.64.up_proj", "model.layers.75.mlp.experts.65.up_proj", "model.layers.75.mlp.experts.66.up_proj", "model.layers.75.mlp.experts.67.up_proj", "model.layers.75.mlp.experts.68.up_proj", "model.layers.75.mlp.experts.69.up_proj", "model.layers.75.mlp.experts.70.up_proj", "model.layers.75.mlp.experts.71.up_proj", "model.layers.75.mlp.experts.72.up_proj", "model.layers.75.mlp.experts.73.up_proj", "model.layers.75.mlp.experts.74.up_proj", "model.layers.75.mlp.experts.75.up_proj", "model.layers.75.mlp.experts.76.up_proj", "model.layers.75.mlp.experts.77.up_proj", "model.layers.75.mlp.experts.78.up_proj", "model.layers.75.mlp.experts.79.up_proj", "model.layers.75.mlp.experts.80.up_proj", "model.layers.75.mlp.experts.81.up_proj", "model.layers.75.mlp.experts.82.up_proj", "model.layers.75.mlp.experts.83.up_proj", "model.layers.75.mlp.experts.84.up_proj", "model.layers.75.mlp.experts.85.up_proj", "model.layers.75.mlp.experts.86.up_proj", "model.layers.75.mlp.experts.87.up_proj", "model.layers.75.mlp.experts.88.up_proj", "model.layers.75.mlp.experts.89.up_proj", "model.layers.75.mlp.experts.90.up_proj", "model.layers.75.mlp.experts.91.up_proj", "model.layers.75.mlp.experts.92.up_proj", "model.layers.75.mlp.experts.93.up_proj", "model.layers.75.mlp.experts.94.up_proj", "model.layers.75.mlp.experts.95.up_proj", "model.layers.75.mlp.experts.96.up_proj", "model.layers.75.mlp.experts.97.up_proj", "model.layers.75.mlp.experts.98.up_proj", "model.layers.75.mlp.experts.99.up_proj", "model.layers.75.mlp.experts.100.up_proj", "model.layers.75.mlp.experts.101.up_proj", "model.layers.75.mlp.experts.102.up_proj", "model.layers.75.mlp.experts.103.up_proj", "model.layers.75.mlp.experts.104.up_proj", "model.layers.75.mlp.experts.105.up_proj", "model.layers.75.mlp.experts.106.up_proj", "model.layers.75.mlp.experts.107.up_proj", "model.layers.75.mlp.experts.108.up_proj", "model.layers.75.mlp.experts.109.up_proj", "model.layers.75.mlp.experts.110.up_proj", "model.layers.75.mlp.experts.111.up_proj", "model.layers.75.mlp.experts.112.up_proj", "model.layers.75.mlp.experts.113.up_proj", "model.layers.75.mlp.experts.114.up_proj", "model.layers.75.mlp.experts.115.up_proj", "model.layers.75.mlp.experts.116.up_proj", "model.layers.75.mlp.experts.117.up_proj", "model.layers.75.mlp.experts.118.up_proj", "model.layers.75.mlp.experts.119.up_proj", "model.layers.75.mlp.experts.120.up_proj", "model.layers.75.mlp.experts.121.up_proj", "model.layers.75.mlp.experts.122.up_proj", "model.layers.75.mlp.experts.123.up_proj", "model.layers.75.mlp.experts.124.up_proj", "model.layers.75.mlp.experts.125.up_proj", "model.layers.75.mlp.experts.126.up_proj", "model.layers.75.mlp.experts.127.up_proj", "model.layers.75.mlp.experts.128.up_proj", "model.layers.75.mlp.experts.129.up_proj", "model.layers.75.mlp.experts.130.up_proj", "model.layers.75.mlp.experts.131.up_proj", "model.layers.75.mlp.experts.132.up_proj", "model.layers.75.mlp.experts.133.up_proj", "model.layers.75.mlp.experts.134.up_proj", "model.layers.75.mlp.experts.135.up_proj", "model.layers.75.mlp.experts.136.up_proj", "model.layers.75.mlp.experts.137.up_proj", "model.layers.75.mlp.experts.138.up_proj", "model.layers.75.mlp.experts.139.up_proj", "model.layers.75.mlp.experts.140.up_proj", "model.layers.75.mlp.experts.141.up_proj", "model.layers.75.mlp.experts.142.up_proj", "model.layers.75.mlp.experts.143.up_proj", "model.layers.75.mlp.experts.144.up_proj", "model.layers.75.mlp.experts.145.up_proj", "model.layers.75.mlp.experts.146.up_proj", "model.layers.75.mlp.experts.147.up_proj", "model.layers.75.mlp.experts.148.up_proj", "model.layers.75.mlp.experts.149.up_proj", "model.layers.75.mlp.experts.150.up_proj", "model.layers.75.mlp.experts.151.up_proj", "model.layers.75.mlp.experts.152.up_proj", "model.layers.75.mlp.experts.153.up_proj", "model.layers.75.mlp.experts.154.up_proj", "model.layers.75.mlp.experts.155.up_proj", "model.layers.75.mlp.experts.156.up_proj", "model.layers.75.mlp.experts.157.up_proj", "model.layers.75.mlp.experts.158.up_proj", "model.layers.75.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.4135975874960076e-05, "dbits": 2516582400 }, { "dkld": -2.516757231205667e-05, "dbits": 5033164800 } ] }, { "idx": 452, "layers": [ "model.layers.75.mlp.experts.0.down_proj", "model.layers.75.mlp.experts.1.down_proj", "model.layers.75.mlp.experts.2.down_proj", "model.layers.75.mlp.experts.3.down_proj", "model.layers.75.mlp.experts.4.down_proj", "model.layers.75.mlp.experts.5.down_proj", "model.layers.75.mlp.experts.6.down_proj", "model.layers.75.mlp.experts.7.down_proj", "model.layers.75.mlp.experts.8.down_proj", "model.layers.75.mlp.experts.9.down_proj", "model.layers.75.mlp.experts.10.down_proj", "model.layers.75.mlp.experts.11.down_proj", "model.layers.75.mlp.experts.12.down_proj", "model.layers.75.mlp.experts.13.down_proj", "model.layers.75.mlp.experts.14.down_proj", "model.layers.75.mlp.experts.15.down_proj", "model.layers.75.mlp.experts.16.down_proj", "model.layers.75.mlp.experts.17.down_proj", "model.layers.75.mlp.experts.18.down_proj", "model.layers.75.mlp.experts.19.down_proj", "model.layers.75.mlp.experts.20.down_proj", "model.layers.75.mlp.experts.21.down_proj", "model.layers.75.mlp.experts.22.down_proj", "model.layers.75.mlp.experts.23.down_proj", "model.layers.75.mlp.experts.24.down_proj", "model.layers.75.mlp.experts.25.down_proj", "model.layers.75.mlp.experts.26.down_proj", "model.layers.75.mlp.experts.27.down_proj", "model.layers.75.mlp.experts.28.down_proj", "model.layers.75.mlp.experts.29.down_proj", "model.layers.75.mlp.experts.30.down_proj", "model.layers.75.mlp.experts.31.down_proj", "model.layers.75.mlp.experts.32.down_proj", "model.layers.75.mlp.experts.33.down_proj", "model.layers.75.mlp.experts.34.down_proj", "model.layers.75.mlp.experts.35.down_proj", "model.layers.75.mlp.experts.36.down_proj", "model.layers.75.mlp.experts.37.down_proj", "model.layers.75.mlp.experts.38.down_proj", "model.layers.75.mlp.experts.39.down_proj", "model.layers.75.mlp.experts.40.down_proj", "model.layers.75.mlp.experts.41.down_proj", "model.layers.75.mlp.experts.42.down_proj", "model.layers.75.mlp.experts.43.down_proj", "model.layers.75.mlp.experts.44.down_proj", "model.layers.75.mlp.experts.45.down_proj", "model.layers.75.mlp.experts.46.down_proj", "model.layers.75.mlp.experts.47.down_proj", "model.layers.75.mlp.experts.48.down_proj", "model.layers.75.mlp.experts.49.down_proj", "model.layers.75.mlp.experts.50.down_proj", "model.layers.75.mlp.experts.51.down_proj", "model.layers.75.mlp.experts.52.down_proj", "model.layers.75.mlp.experts.53.down_proj", "model.layers.75.mlp.experts.54.down_proj", "model.layers.75.mlp.experts.55.down_proj", "model.layers.75.mlp.experts.56.down_proj", "model.layers.75.mlp.experts.57.down_proj", "model.layers.75.mlp.experts.58.down_proj", "model.layers.75.mlp.experts.59.down_proj", "model.layers.75.mlp.experts.60.down_proj", "model.layers.75.mlp.experts.61.down_proj", "model.layers.75.mlp.experts.62.down_proj", "model.layers.75.mlp.experts.63.down_proj", "model.layers.75.mlp.experts.64.down_proj", "model.layers.75.mlp.experts.65.down_proj", "model.layers.75.mlp.experts.66.down_proj", "model.layers.75.mlp.experts.67.down_proj", "model.layers.75.mlp.experts.68.down_proj", "model.layers.75.mlp.experts.69.down_proj", "model.layers.75.mlp.experts.70.down_proj", "model.layers.75.mlp.experts.71.down_proj", "model.layers.75.mlp.experts.72.down_proj", "model.layers.75.mlp.experts.73.down_proj", "model.layers.75.mlp.experts.74.down_proj", "model.layers.75.mlp.experts.75.down_proj", "model.layers.75.mlp.experts.76.down_proj", "model.layers.75.mlp.experts.77.down_proj", "model.layers.75.mlp.experts.78.down_proj", "model.layers.75.mlp.experts.79.down_proj", "model.layers.75.mlp.experts.80.down_proj", "model.layers.75.mlp.experts.81.down_proj", "model.layers.75.mlp.experts.82.down_proj", "model.layers.75.mlp.experts.83.down_proj", "model.layers.75.mlp.experts.84.down_proj", "model.layers.75.mlp.experts.85.down_proj", "model.layers.75.mlp.experts.86.down_proj", "model.layers.75.mlp.experts.87.down_proj", "model.layers.75.mlp.experts.88.down_proj", "model.layers.75.mlp.experts.89.down_proj", "model.layers.75.mlp.experts.90.down_proj", "model.layers.75.mlp.experts.91.down_proj", "model.layers.75.mlp.experts.92.down_proj", "model.layers.75.mlp.experts.93.down_proj", "model.layers.75.mlp.experts.94.down_proj", "model.layers.75.mlp.experts.95.down_proj", "model.layers.75.mlp.experts.96.down_proj", "model.layers.75.mlp.experts.97.down_proj", "model.layers.75.mlp.experts.98.down_proj", "model.layers.75.mlp.experts.99.down_proj", "model.layers.75.mlp.experts.100.down_proj", "model.layers.75.mlp.experts.101.down_proj", "model.layers.75.mlp.experts.102.down_proj", "model.layers.75.mlp.experts.103.down_proj", "model.layers.75.mlp.experts.104.down_proj", "model.layers.75.mlp.experts.105.down_proj", "model.layers.75.mlp.experts.106.down_proj", "model.layers.75.mlp.experts.107.down_proj", "model.layers.75.mlp.experts.108.down_proj", "model.layers.75.mlp.experts.109.down_proj", "model.layers.75.mlp.experts.110.down_proj", "model.layers.75.mlp.experts.111.down_proj", "model.layers.75.mlp.experts.112.down_proj", "model.layers.75.mlp.experts.113.down_proj", "model.layers.75.mlp.experts.114.down_proj", "model.layers.75.mlp.experts.115.down_proj", "model.layers.75.mlp.experts.116.down_proj", "model.layers.75.mlp.experts.117.down_proj", "model.layers.75.mlp.experts.118.down_proj", "model.layers.75.mlp.experts.119.down_proj", "model.layers.75.mlp.experts.120.down_proj", "model.layers.75.mlp.experts.121.down_proj", "model.layers.75.mlp.experts.122.down_proj", "model.layers.75.mlp.experts.123.down_proj", "model.layers.75.mlp.experts.124.down_proj", "model.layers.75.mlp.experts.125.down_proj", "model.layers.75.mlp.experts.126.down_proj", "model.layers.75.mlp.experts.127.down_proj", "model.layers.75.mlp.experts.128.down_proj", "model.layers.75.mlp.experts.129.down_proj", "model.layers.75.mlp.experts.130.down_proj", "model.layers.75.mlp.experts.131.down_proj", "model.layers.75.mlp.experts.132.down_proj", "model.layers.75.mlp.experts.133.down_proj", "model.layers.75.mlp.experts.134.down_proj", "model.layers.75.mlp.experts.135.down_proj", "model.layers.75.mlp.experts.136.down_proj", "model.layers.75.mlp.experts.137.down_proj", "model.layers.75.mlp.experts.138.down_proj", "model.layers.75.mlp.experts.139.down_proj", "model.layers.75.mlp.experts.140.down_proj", "model.layers.75.mlp.experts.141.down_proj", "model.layers.75.mlp.experts.142.down_proj", "model.layers.75.mlp.experts.143.down_proj", "model.layers.75.mlp.experts.144.down_proj", "model.layers.75.mlp.experts.145.down_proj", "model.layers.75.mlp.experts.146.down_proj", "model.layers.75.mlp.experts.147.down_proj", "model.layers.75.mlp.experts.148.down_proj", "model.layers.75.mlp.experts.149.down_proj", "model.layers.75.mlp.experts.150.down_proj", "model.layers.75.mlp.experts.151.down_proj", "model.layers.75.mlp.experts.152.down_proj", "model.layers.75.mlp.experts.153.down_proj", "model.layers.75.mlp.experts.154.down_proj", "model.layers.75.mlp.experts.155.down_proj", "model.layers.75.mlp.experts.156.down_proj", "model.layers.75.mlp.experts.157.down_proj", "model.layers.75.mlp.experts.158.down_proj", "model.layers.75.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.2677861377582977e-06, "dbits": 1258291200 }, { "dkld": 2.7583446353673935e-06, "dbits": 2516582400 } ] }, { "idx": 453, "layers": [ "model.layers.76.self_attn.q_proj" ], "candidates": [ { "dkld": -0.00011461339890956809, "dbits": 62914560 }, { "dkld": -0.00010740214493125573, "dbits": 125829120 } ] }, { "idx": 454, "layers": [ "model.layers.76.self_attn.k_proj", "model.layers.76.self_attn.v_proj" ], "candidates": [ { "dkld": -4.1483319364488125e-05, "dbits": 10485760 }, { "dkld": -4.284260794520239e-05, "dbits": 20971520 } ] }, { "idx": 455, "layers": [ "model.layers.76.self_attn.o_proj" ], "candidates": [ { "dkld": -7.515796460209889e-06, "dbits": 62914560 }, { "dkld": -2.498310059308867e-05, "dbits": 125829120 } ] }, { "idx": 456, "layers": [ "model.layers.76.mlp.shared_experts.gate_proj", "model.layers.76.mlp.shared_experts.up_proj", "model.layers.76.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -5.493210628628592e-05, "dbits": 23592960 }, { "dkld": -4.0085474029182694e-05, "dbits": 47185920 } ] }, { "idx": 457, "layers": [ "model.layers.76.mlp.experts.0.gate_proj", "model.layers.76.mlp.experts.1.gate_proj", "model.layers.76.mlp.experts.2.gate_proj", "model.layers.76.mlp.experts.3.gate_proj", "model.layers.76.mlp.experts.4.gate_proj", "model.layers.76.mlp.experts.5.gate_proj", "model.layers.76.mlp.experts.6.gate_proj", "model.layers.76.mlp.experts.7.gate_proj", "model.layers.76.mlp.experts.8.gate_proj", "model.layers.76.mlp.experts.9.gate_proj", "model.layers.76.mlp.experts.10.gate_proj", "model.layers.76.mlp.experts.11.gate_proj", "model.layers.76.mlp.experts.12.gate_proj", "model.layers.76.mlp.experts.13.gate_proj", "model.layers.76.mlp.experts.14.gate_proj", "model.layers.76.mlp.experts.15.gate_proj", "model.layers.76.mlp.experts.16.gate_proj", "model.layers.76.mlp.experts.17.gate_proj", "model.layers.76.mlp.experts.18.gate_proj", "model.layers.76.mlp.experts.19.gate_proj", "model.layers.76.mlp.experts.20.gate_proj", "model.layers.76.mlp.experts.21.gate_proj", "model.layers.76.mlp.experts.22.gate_proj", "model.layers.76.mlp.experts.23.gate_proj", "model.layers.76.mlp.experts.24.gate_proj", "model.layers.76.mlp.experts.25.gate_proj", "model.layers.76.mlp.experts.26.gate_proj", "model.layers.76.mlp.experts.27.gate_proj", "model.layers.76.mlp.experts.28.gate_proj", "model.layers.76.mlp.experts.29.gate_proj", "model.layers.76.mlp.experts.30.gate_proj", "model.layers.76.mlp.experts.31.gate_proj", "model.layers.76.mlp.experts.32.gate_proj", "model.layers.76.mlp.experts.33.gate_proj", "model.layers.76.mlp.experts.34.gate_proj", "model.layers.76.mlp.experts.35.gate_proj", "model.layers.76.mlp.experts.36.gate_proj", "model.layers.76.mlp.experts.37.gate_proj", "model.layers.76.mlp.experts.38.gate_proj", "model.layers.76.mlp.experts.39.gate_proj", "model.layers.76.mlp.experts.40.gate_proj", "model.layers.76.mlp.experts.41.gate_proj", "model.layers.76.mlp.experts.42.gate_proj", "model.layers.76.mlp.experts.43.gate_proj", "model.layers.76.mlp.experts.44.gate_proj", "model.layers.76.mlp.experts.45.gate_proj", "model.layers.76.mlp.experts.46.gate_proj", "model.layers.76.mlp.experts.47.gate_proj", "model.layers.76.mlp.experts.48.gate_proj", "model.layers.76.mlp.experts.49.gate_proj", "model.layers.76.mlp.experts.50.gate_proj", "model.layers.76.mlp.experts.51.gate_proj", "model.layers.76.mlp.experts.52.gate_proj", "model.layers.76.mlp.experts.53.gate_proj", "model.layers.76.mlp.experts.54.gate_proj", "model.layers.76.mlp.experts.55.gate_proj", "model.layers.76.mlp.experts.56.gate_proj", "model.layers.76.mlp.experts.57.gate_proj", "model.layers.76.mlp.experts.58.gate_proj", "model.layers.76.mlp.experts.59.gate_proj", "model.layers.76.mlp.experts.60.gate_proj", "model.layers.76.mlp.experts.61.gate_proj", "model.layers.76.mlp.experts.62.gate_proj", "model.layers.76.mlp.experts.63.gate_proj", "model.layers.76.mlp.experts.64.gate_proj", "model.layers.76.mlp.experts.65.gate_proj", "model.layers.76.mlp.experts.66.gate_proj", "model.layers.76.mlp.experts.67.gate_proj", "model.layers.76.mlp.experts.68.gate_proj", "model.layers.76.mlp.experts.69.gate_proj", "model.layers.76.mlp.experts.70.gate_proj", "model.layers.76.mlp.experts.71.gate_proj", "model.layers.76.mlp.experts.72.gate_proj", "model.layers.76.mlp.experts.73.gate_proj", "model.layers.76.mlp.experts.74.gate_proj", "model.layers.76.mlp.experts.75.gate_proj", "model.layers.76.mlp.experts.76.gate_proj", "model.layers.76.mlp.experts.77.gate_proj", "model.layers.76.mlp.experts.78.gate_proj", "model.layers.76.mlp.experts.79.gate_proj", "model.layers.76.mlp.experts.80.gate_proj", "model.layers.76.mlp.experts.81.gate_proj", "model.layers.76.mlp.experts.82.gate_proj", "model.layers.76.mlp.experts.83.gate_proj", "model.layers.76.mlp.experts.84.gate_proj", "model.layers.76.mlp.experts.85.gate_proj", "model.layers.76.mlp.experts.86.gate_proj", "model.layers.76.mlp.experts.87.gate_proj", "model.layers.76.mlp.experts.88.gate_proj", "model.layers.76.mlp.experts.89.gate_proj", "model.layers.76.mlp.experts.90.gate_proj", "model.layers.76.mlp.experts.91.gate_proj", "model.layers.76.mlp.experts.92.gate_proj", "model.layers.76.mlp.experts.93.gate_proj", "model.layers.76.mlp.experts.94.gate_proj", "model.layers.76.mlp.experts.95.gate_proj", "model.layers.76.mlp.experts.96.gate_proj", "model.layers.76.mlp.experts.97.gate_proj", "model.layers.76.mlp.experts.98.gate_proj", "model.layers.76.mlp.experts.99.gate_proj", "model.layers.76.mlp.experts.100.gate_proj", "model.layers.76.mlp.experts.101.gate_proj", "model.layers.76.mlp.experts.102.gate_proj", "model.layers.76.mlp.experts.103.gate_proj", "model.layers.76.mlp.experts.104.gate_proj", "model.layers.76.mlp.experts.105.gate_proj", "model.layers.76.mlp.experts.106.gate_proj", "model.layers.76.mlp.experts.107.gate_proj", "model.layers.76.mlp.experts.108.gate_proj", "model.layers.76.mlp.experts.109.gate_proj", "model.layers.76.mlp.experts.110.gate_proj", "model.layers.76.mlp.experts.111.gate_proj", "model.layers.76.mlp.experts.112.gate_proj", "model.layers.76.mlp.experts.113.gate_proj", "model.layers.76.mlp.experts.114.gate_proj", "model.layers.76.mlp.experts.115.gate_proj", "model.layers.76.mlp.experts.116.gate_proj", "model.layers.76.mlp.experts.117.gate_proj", "model.layers.76.mlp.experts.118.gate_proj", "model.layers.76.mlp.experts.119.gate_proj", "model.layers.76.mlp.experts.120.gate_proj", "model.layers.76.mlp.experts.121.gate_proj", "model.layers.76.mlp.experts.122.gate_proj", "model.layers.76.mlp.experts.123.gate_proj", "model.layers.76.mlp.experts.124.gate_proj", "model.layers.76.mlp.experts.125.gate_proj", "model.layers.76.mlp.experts.126.gate_proj", "model.layers.76.mlp.experts.127.gate_proj", "model.layers.76.mlp.experts.128.gate_proj", "model.layers.76.mlp.experts.129.gate_proj", "model.layers.76.mlp.experts.130.gate_proj", "model.layers.76.mlp.experts.131.gate_proj", "model.layers.76.mlp.experts.132.gate_proj", "model.layers.76.mlp.experts.133.gate_proj", "model.layers.76.mlp.experts.134.gate_proj", "model.layers.76.mlp.experts.135.gate_proj", "model.layers.76.mlp.experts.136.gate_proj", "model.layers.76.mlp.experts.137.gate_proj", "model.layers.76.mlp.experts.138.gate_proj", "model.layers.76.mlp.experts.139.gate_proj", "model.layers.76.mlp.experts.140.gate_proj", "model.layers.76.mlp.experts.141.gate_proj", "model.layers.76.mlp.experts.142.gate_proj", "model.layers.76.mlp.experts.143.gate_proj", "model.layers.76.mlp.experts.144.gate_proj", "model.layers.76.mlp.experts.145.gate_proj", "model.layers.76.mlp.experts.146.gate_proj", "model.layers.76.mlp.experts.147.gate_proj", "model.layers.76.mlp.experts.148.gate_proj", "model.layers.76.mlp.experts.149.gate_proj", "model.layers.76.mlp.experts.150.gate_proj", "model.layers.76.mlp.experts.151.gate_proj", "model.layers.76.mlp.experts.152.gate_proj", "model.layers.76.mlp.experts.153.gate_proj", "model.layers.76.mlp.experts.154.gate_proj", "model.layers.76.mlp.experts.155.gate_proj", "model.layers.76.mlp.experts.156.gate_proj", "model.layers.76.mlp.experts.157.gate_proj", "model.layers.76.mlp.experts.158.gate_proj", "model.layers.76.mlp.experts.159.gate_proj", "model.layers.76.mlp.experts.0.up_proj", "model.layers.76.mlp.experts.1.up_proj", "model.layers.76.mlp.experts.2.up_proj", "model.layers.76.mlp.experts.3.up_proj", "model.layers.76.mlp.experts.4.up_proj", "model.layers.76.mlp.experts.5.up_proj", "model.layers.76.mlp.experts.6.up_proj", "model.layers.76.mlp.experts.7.up_proj", "model.layers.76.mlp.experts.8.up_proj", "model.layers.76.mlp.experts.9.up_proj", "model.layers.76.mlp.experts.10.up_proj", "model.layers.76.mlp.experts.11.up_proj", "model.layers.76.mlp.experts.12.up_proj", "model.layers.76.mlp.experts.13.up_proj", "model.layers.76.mlp.experts.14.up_proj", "model.layers.76.mlp.experts.15.up_proj", "model.layers.76.mlp.experts.16.up_proj", "model.layers.76.mlp.experts.17.up_proj", "model.layers.76.mlp.experts.18.up_proj", "model.layers.76.mlp.experts.19.up_proj", "model.layers.76.mlp.experts.20.up_proj", "model.layers.76.mlp.experts.21.up_proj", "model.layers.76.mlp.experts.22.up_proj", "model.layers.76.mlp.experts.23.up_proj", "model.layers.76.mlp.experts.24.up_proj", "model.layers.76.mlp.experts.25.up_proj", "model.layers.76.mlp.experts.26.up_proj", "model.layers.76.mlp.experts.27.up_proj", "model.layers.76.mlp.experts.28.up_proj", "model.layers.76.mlp.experts.29.up_proj", "model.layers.76.mlp.experts.30.up_proj", "model.layers.76.mlp.experts.31.up_proj", "model.layers.76.mlp.experts.32.up_proj", "model.layers.76.mlp.experts.33.up_proj", "model.layers.76.mlp.experts.34.up_proj", "model.layers.76.mlp.experts.35.up_proj", "model.layers.76.mlp.experts.36.up_proj", "model.layers.76.mlp.experts.37.up_proj", "model.layers.76.mlp.experts.38.up_proj", "model.layers.76.mlp.experts.39.up_proj", "model.layers.76.mlp.experts.40.up_proj", "model.layers.76.mlp.experts.41.up_proj", "model.layers.76.mlp.experts.42.up_proj", "model.layers.76.mlp.experts.43.up_proj", "model.layers.76.mlp.experts.44.up_proj", "model.layers.76.mlp.experts.45.up_proj", "model.layers.76.mlp.experts.46.up_proj", "model.layers.76.mlp.experts.47.up_proj", "model.layers.76.mlp.experts.48.up_proj", "model.layers.76.mlp.experts.49.up_proj", "model.layers.76.mlp.experts.50.up_proj", "model.layers.76.mlp.experts.51.up_proj", "model.layers.76.mlp.experts.52.up_proj", "model.layers.76.mlp.experts.53.up_proj", "model.layers.76.mlp.experts.54.up_proj", "model.layers.76.mlp.experts.55.up_proj", "model.layers.76.mlp.experts.56.up_proj", "model.layers.76.mlp.experts.57.up_proj", "model.layers.76.mlp.experts.58.up_proj", "model.layers.76.mlp.experts.59.up_proj", "model.layers.76.mlp.experts.60.up_proj", "model.layers.76.mlp.experts.61.up_proj", "model.layers.76.mlp.experts.62.up_proj", "model.layers.76.mlp.experts.63.up_proj", "model.layers.76.mlp.experts.64.up_proj", "model.layers.76.mlp.experts.65.up_proj", "model.layers.76.mlp.experts.66.up_proj", "model.layers.76.mlp.experts.67.up_proj", "model.layers.76.mlp.experts.68.up_proj", "model.layers.76.mlp.experts.69.up_proj", "model.layers.76.mlp.experts.70.up_proj", "model.layers.76.mlp.experts.71.up_proj", "model.layers.76.mlp.experts.72.up_proj", "model.layers.76.mlp.experts.73.up_proj", "model.layers.76.mlp.experts.74.up_proj", "model.layers.76.mlp.experts.75.up_proj", "model.layers.76.mlp.experts.76.up_proj", "model.layers.76.mlp.experts.77.up_proj", "model.layers.76.mlp.experts.78.up_proj", "model.layers.76.mlp.experts.79.up_proj", "model.layers.76.mlp.experts.80.up_proj", "model.layers.76.mlp.experts.81.up_proj", "model.layers.76.mlp.experts.82.up_proj", "model.layers.76.mlp.experts.83.up_proj", "model.layers.76.mlp.experts.84.up_proj", "model.layers.76.mlp.experts.85.up_proj", "model.layers.76.mlp.experts.86.up_proj", "model.layers.76.mlp.experts.87.up_proj", "model.layers.76.mlp.experts.88.up_proj", "model.layers.76.mlp.experts.89.up_proj", "model.layers.76.mlp.experts.90.up_proj", "model.layers.76.mlp.experts.91.up_proj", "model.layers.76.mlp.experts.92.up_proj", "model.layers.76.mlp.experts.93.up_proj", "model.layers.76.mlp.experts.94.up_proj", "model.layers.76.mlp.experts.95.up_proj", "model.layers.76.mlp.experts.96.up_proj", "model.layers.76.mlp.experts.97.up_proj", "model.layers.76.mlp.experts.98.up_proj", "model.layers.76.mlp.experts.99.up_proj", "model.layers.76.mlp.experts.100.up_proj", "model.layers.76.mlp.experts.101.up_proj", "model.layers.76.mlp.experts.102.up_proj", "model.layers.76.mlp.experts.103.up_proj", "model.layers.76.mlp.experts.104.up_proj", "model.layers.76.mlp.experts.105.up_proj", "model.layers.76.mlp.experts.106.up_proj", "model.layers.76.mlp.experts.107.up_proj", "model.layers.76.mlp.experts.108.up_proj", "model.layers.76.mlp.experts.109.up_proj", "model.layers.76.mlp.experts.110.up_proj", "model.layers.76.mlp.experts.111.up_proj", "model.layers.76.mlp.experts.112.up_proj", "model.layers.76.mlp.experts.113.up_proj", "model.layers.76.mlp.experts.114.up_proj", "model.layers.76.mlp.experts.115.up_proj", "model.layers.76.mlp.experts.116.up_proj", "model.layers.76.mlp.experts.117.up_proj", "model.layers.76.mlp.experts.118.up_proj", "model.layers.76.mlp.experts.119.up_proj", "model.layers.76.mlp.experts.120.up_proj", "model.layers.76.mlp.experts.121.up_proj", "model.layers.76.mlp.experts.122.up_proj", "model.layers.76.mlp.experts.123.up_proj", "model.layers.76.mlp.experts.124.up_proj", "model.layers.76.mlp.experts.125.up_proj", "model.layers.76.mlp.experts.126.up_proj", "model.layers.76.mlp.experts.127.up_proj", "model.layers.76.mlp.experts.128.up_proj", "model.layers.76.mlp.experts.129.up_proj", "model.layers.76.mlp.experts.130.up_proj", "model.layers.76.mlp.experts.131.up_proj", "model.layers.76.mlp.experts.132.up_proj", "model.layers.76.mlp.experts.133.up_proj", "model.layers.76.mlp.experts.134.up_proj", "model.layers.76.mlp.experts.135.up_proj", "model.layers.76.mlp.experts.136.up_proj", "model.layers.76.mlp.experts.137.up_proj", "model.layers.76.mlp.experts.138.up_proj", "model.layers.76.mlp.experts.139.up_proj", "model.layers.76.mlp.experts.140.up_proj", "model.layers.76.mlp.experts.141.up_proj", "model.layers.76.mlp.experts.142.up_proj", "model.layers.76.mlp.experts.143.up_proj", "model.layers.76.mlp.experts.144.up_proj", "model.layers.76.mlp.experts.145.up_proj", "model.layers.76.mlp.experts.146.up_proj", "model.layers.76.mlp.experts.147.up_proj", "model.layers.76.mlp.experts.148.up_proj", "model.layers.76.mlp.experts.149.up_proj", "model.layers.76.mlp.experts.150.up_proj", "model.layers.76.mlp.experts.151.up_proj", "model.layers.76.mlp.experts.152.up_proj", "model.layers.76.mlp.experts.153.up_proj", "model.layers.76.mlp.experts.154.up_proj", "model.layers.76.mlp.experts.155.up_proj", "model.layers.76.mlp.experts.156.up_proj", "model.layers.76.mlp.experts.157.up_proj", "model.layers.76.mlp.experts.158.up_proj", "model.layers.76.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -2.3342575877903504e-05, "dbits": 2516582400 }, { "dkld": -2.2314419038592728e-05, "dbits": 5033164800 } ] }, { "idx": 458, "layers": [ "model.layers.76.mlp.experts.0.down_proj", "model.layers.76.mlp.experts.1.down_proj", "model.layers.76.mlp.experts.2.down_proj", "model.layers.76.mlp.experts.3.down_proj", "model.layers.76.mlp.experts.4.down_proj", "model.layers.76.mlp.experts.5.down_proj", "model.layers.76.mlp.experts.6.down_proj", "model.layers.76.mlp.experts.7.down_proj", "model.layers.76.mlp.experts.8.down_proj", "model.layers.76.mlp.experts.9.down_proj", "model.layers.76.mlp.experts.10.down_proj", "model.layers.76.mlp.experts.11.down_proj", "model.layers.76.mlp.experts.12.down_proj", "model.layers.76.mlp.experts.13.down_proj", "model.layers.76.mlp.experts.14.down_proj", "model.layers.76.mlp.experts.15.down_proj", "model.layers.76.mlp.experts.16.down_proj", "model.layers.76.mlp.experts.17.down_proj", "model.layers.76.mlp.experts.18.down_proj", "model.layers.76.mlp.experts.19.down_proj", "model.layers.76.mlp.experts.20.down_proj", "model.layers.76.mlp.experts.21.down_proj", "model.layers.76.mlp.experts.22.down_proj", "model.layers.76.mlp.experts.23.down_proj", "model.layers.76.mlp.experts.24.down_proj", "model.layers.76.mlp.experts.25.down_proj", "model.layers.76.mlp.experts.26.down_proj", "model.layers.76.mlp.experts.27.down_proj", "model.layers.76.mlp.experts.28.down_proj", "model.layers.76.mlp.experts.29.down_proj", "model.layers.76.mlp.experts.30.down_proj", "model.layers.76.mlp.experts.31.down_proj", "model.layers.76.mlp.experts.32.down_proj", "model.layers.76.mlp.experts.33.down_proj", "model.layers.76.mlp.experts.34.down_proj", "model.layers.76.mlp.experts.35.down_proj", "model.layers.76.mlp.experts.36.down_proj", "model.layers.76.mlp.experts.37.down_proj", "model.layers.76.mlp.experts.38.down_proj", "model.layers.76.mlp.experts.39.down_proj", "model.layers.76.mlp.experts.40.down_proj", "model.layers.76.mlp.experts.41.down_proj", "model.layers.76.mlp.experts.42.down_proj", "model.layers.76.mlp.experts.43.down_proj", "model.layers.76.mlp.experts.44.down_proj", "model.layers.76.mlp.experts.45.down_proj", "model.layers.76.mlp.experts.46.down_proj", "model.layers.76.mlp.experts.47.down_proj", "model.layers.76.mlp.experts.48.down_proj", "model.layers.76.mlp.experts.49.down_proj", "model.layers.76.mlp.experts.50.down_proj", "model.layers.76.mlp.experts.51.down_proj", "model.layers.76.mlp.experts.52.down_proj", "model.layers.76.mlp.experts.53.down_proj", "model.layers.76.mlp.experts.54.down_proj", "model.layers.76.mlp.experts.55.down_proj", "model.layers.76.mlp.experts.56.down_proj", "model.layers.76.mlp.experts.57.down_proj", "model.layers.76.mlp.experts.58.down_proj", "model.layers.76.mlp.experts.59.down_proj", "model.layers.76.mlp.experts.60.down_proj", "model.layers.76.mlp.experts.61.down_proj", "model.layers.76.mlp.experts.62.down_proj", "model.layers.76.mlp.experts.63.down_proj", "model.layers.76.mlp.experts.64.down_proj", "model.layers.76.mlp.experts.65.down_proj", "model.layers.76.mlp.experts.66.down_proj", "model.layers.76.mlp.experts.67.down_proj", "model.layers.76.mlp.experts.68.down_proj", "model.layers.76.mlp.experts.69.down_proj", "model.layers.76.mlp.experts.70.down_proj", "model.layers.76.mlp.experts.71.down_proj", "model.layers.76.mlp.experts.72.down_proj", "model.layers.76.mlp.experts.73.down_proj", "model.layers.76.mlp.experts.74.down_proj", "model.layers.76.mlp.experts.75.down_proj", "model.layers.76.mlp.experts.76.down_proj", "model.layers.76.mlp.experts.77.down_proj", "model.layers.76.mlp.experts.78.down_proj", "model.layers.76.mlp.experts.79.down_proj", "model.layers.76.mlp.experts.80.down_proj", "model.layers.76.mlp.experts.81.down_proj", "model.layers.76.mlp.experts.82.down_proj", "model.layers.76.mlp.experts.83.down_proj", "model.layers.76.mlp.experts.84.down_proj", "model.layers.76.mlp.experts.85.down_proj", "model.layers.76.mlp.experts.86.down_proj", "model.layers.76.mlp.experts.87.down_proj", "model.layers.76.mlp.experts.88.down_proj", "model.layers.76.mlp.experts.89.down_proj", "model.layers.76.mlp.experts.90.down_proj", "model.layers.76.mlp.experts.91.down_proj", "model.layers.76.mlp.experts.92.down_proj", "model.layers.76.mlp.experts.93.down_proj", "model.layers.76.mlp.experts.94.down_proj", "model.layers.76.mlp.experts.95.down_proj", "model.layers.76.mlp.experts.96.down_proj", "model.layers.76.mlp.experts.97.down_proj", "model.layers.76.mlp.experts.98.down_proj", "model.layers.76.mlp.experts.99.down_proj", "model.layers.76.mlp.experts.100.down_proj", "model.layers.76.mlp.experts.101.down_proj", "model.layers.76.mlp.experts.102.down_proj", "model.layers.76.mlp.experts.103.down_proj", "model.layers.76.mlp.experts.104.down_proj", "model.layers.76.mlp.experts.105.down_proj", "model.layers.76.mlp.experts.106.down_proj", "model.layers.76.mlp.experts.107.down_proj", "model.layers.76.mlp.experts.108.down_proj", "model.layers.76.mlp.experts.109.down_proj", "model.layers.76.mlp.experts.110.down_proj", "model.layers.76.mlp.experts.111.down_proj", "model.layers.76.mlp.experts.112.down_proj", "model.layers.76.mlp.experts.113.down_proj", "model.layers.76.mlp.experts.114.down_proj", "model.layers.76.mlp.experts.115.down_proj", "model.layers.76.mlp.experts.116.down_proj", "model.layers.76.mlp.experts.117.down_proj", "model.layers.76.mlp.experts.118.down_proj", "model.layers.76.mlp.experts.119.down_proj", "model.layers.76.mlp.experts.120.down_proj", "model.layers.76.mlp.experts.121.down_proj", "model.layers.76.mlp.experts.122.down_proj", "model.layers.76.mlp.experts.123.down_proj", "model.layers.76.mlp.experts.124.down_proj", "model.layers.76.mlp.experts.125.down_proj", "model.layers.76.mlp.experts.126.down_proj", "model.layers.76.mlp.experts.127.down_proj", "model.layers.76.mlp.experts.128.down_proj", "model.layers.76.mlp.experts.129.down_proj", "model.layers.76.mlp.experts.130.down_proj", "model.layers.76.mlp.experts.131.down_proj", "model.layers.76.mlp.experts.132.down_proj", "model.layers.76.mlp.experts.133.down_proj", "model.layers.76.mlp.experts.134.down_proj", "model.layers.76.mlp.experts.135.down_proj", "model.layers.76.mlp.experts.136.down_proj", "model.layers.76.mlp.experts.137.down_proj", "model.layers.76.mlp.experts.138.down_proj", "model.layers.76.mlp.experts.139.down_proj", "model.layers.76.mlp.experts.140.down_proj", "model.layers.76.mlp.experts.141.down_proj", "model.layers.76.mlp.experts.142.down_proj", "model.layers.76.mlp.experts.143.down_proj", "model.layers.76.mlp.experts.144.down_proj", "model.layers.76.mlp.experts.145.down_proj", "model.layers.76.mlp.experts.146.down_proj", "model.layers.76.mlp.experts.147.down_proj", "model.layers.76.mlp.experts.148.down_proj", "model.layers.76.mlp.experts.149.down_proj", "model.layers.76.mlp.experts.150.down_proj", "model.layers.76.mlp.experts.151.down_proj", "model.layers.76.mlp.experts.152.down_proj", "model.layers.76.mlp.experts.153.down_proj", "model.layers.76.mlp.experts.154.down_proj", "model.layers.76.mlp.experts.155.down_proj", "model.layers.76.mlp.experts.156.down_proj", "model.layers.76.mlp.experts.157.down_proj", "model.layers.76.mlp.experts.158.down_proj", "model.layers.76.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.9357074052095413e-05, "dbits": 1258291200 }, { "dkld": 2.688961103572418e-07, "dbits": 2516582400 } ] }, { "idx": 459, "layers": [ "model.layers.77.self_attn.q_proj" ], "candidates": [ { "dkld": -2.130351494997705e-05, "dbits": 62914560 }, { "dkld": -3.3774226903914364e-05, "dbits": 125829120 } ] }, { "idx": 460, "layers": [ "model.layers.77.self_attn.k_proj", "model.layers.77.self_attn.v_proj" ], "candidates": [ { "dkld": -7.406082004308631e-05, "dbits": 10485760 }, { "dkld": -6.528683006763389e-05, "dbits": 20971520 } ] }, { "idx": 461, "layers": [ "model.layers.77.self_attn.o_proj" ], "candidates": [ { "dkld": -1.3834214769303799e-05, "dbits": 62914560 }, { "dkld": -1.9877310842275273e-05, "dbits": 125829120 } ] }, { "idx": 462, "layers": [ "model.layers.77.mlp.shared_experts.gate_proj", "model.layers.77.mlp.shared_experts.up_proj", "model.layers.77.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.7036427743732582e-05, "dbits": 23592960 }, { "dkld": 2.8679147362709045e-05, "dbits": 47185920 } ] }, { "idx": 463, "layers": [ "model.layers.77.mlp.experts.0.gate_proj", "model.layers.77.mlp.experts.1.gate_proj", "model.layers.77.mlp.experts.2.gate_proj", "model.layers.77.mlp.experts.3.gate_proj", "model.layers.77.mlp.experts.4.gate_proj", "model.layers.77.mlp.experts.5.gate_proj", "model.layers.77.mlp.experts.6.gate_proj", "model.layers.77.mlp.experts.7.gate_proj", "model.layers.77.mlp.experts.8.gate_proj", "model.layers.77.mlp.experts.9.gate_proj", "model.layers.77.mlp.experts.10.gate_proj", "model.layers.77.mlp.experts.11.gate_proj", "model.layers.77.mlp.experts.12.gate_proj", "model.layers.77.mlp.experts.13.gate_proj", "model.layers.77.mlp.experts.14.gate_proj", "model.layers.77.mlp.experts.15.gate_proj", "model.layers.77.mlp.experts.16.gate_proj", "model.layers.77.mlp.experts.17.gate_proj", "model.layers.77.mlp.experts.18.gate_proj", "model.layers.77.mlp.experts.19.gate_proj", "model.layers.77.mlp.experts.20.gate_proj", "model.layers.77.mlp.experts.21.gate_proj", "model.layers.77.mlp.experts.22.gate_proj", "model.layers.77.mlp.experts.23.gate_proj", "model.layers.77.mlp.experts.24.gate_proj", "model.layers.77.mlp.experts.25.gate_proj", "model.layers.77.mlp.experts.26.gate_proj", "model.layers.77.mlp.experts.27.gate_proj", "model.layers.77.mlp.experts.28.gate_proj", "model.layers.77.mlp.experts.29.gate_proj", "model.layers.77.mlp.experts.30.gate_proj", "model.layers.77.mlp.experts.31.gate_proj", "model.layers.77.mlp.experts.32.gate_proj", "model.layers.77.mlp.experts.33.gate_proj", "model.layers.77.mlp.experts.34.gate_proj", "model.layers.77.mlp.experts.35.gate_proj", "model.layers.77.mlp.experts.36.gate_proj", "model.layers.77.mlp.experts.37.gate_proj", "model.layers.77.mlp.experts.38.gate_proj", "model.layers.77.mlp.experts.39.gate_proj", "model.layers.77.mlp.experts.40.gate_proj", "model.layers.77.mlp.experts.41.gate_proj", "model.layers.77.mlp.experts.42.gate_proj", "model.layers.77.mlp.experts.43.gate_proj", "model.layers.77.mlp.experts.44.gate_proj", "model.layers.77.mlp.experts.45.gate_proj", "model.layers.77.mlp.experts.46.gate_proj", "model.layers.77.mlp.experts.47.gate_proj", "model.layers.77.mlp.experts.48.gate_proj", "model.layers.77.mlp.experts.49.gate_proj", "model.layers.77.mlp.experts.50.gate_proj", "model.layers.77.mlp.experts.51.gate_proj", "model.layers.77.mlp.experts.52.gate_proj", "model.layers.77.mlp.experts.53.gate_proj", "model.layers.77.mlp.experts.54.gate_proj", "model.layers.77.mlp.experts.55.gate_proj", "model.layers.77.mlp.experts.56.gate_proj", "model.layers.77.mlp.experts.57.gate_proj", "model.layers.77.mlp.experts.58.gate_proj", "model.layers.77.mlp.experts.59.gate_proj", "model.layers.77.mlp.experts.60.gate_proj", "model.layers.77.mlp.experts.61.gate_proj", "model.layers.77.mlp.experts.62.gate_proj", "model.layers.77.mlp.experts.63.gate_proj", "model.layers.77.mlp.experts.64.gate_proj", "model.layers.77.mlp.experts.65.gate_proj", "model.layers.77.mlp.experts.66.gate_proj", "model.layers.77.mlp.experts.67.gate_proj", "model.layers.77.mlp.experts.68.gate_proj", "model.layers.77.mlp.experts.69.gate_proj", "model.layers.77.mlp.experts.70.gate_proj", "model.layers.77.mlp.experts.71.gate_proj", "model.layers.77.mlp.experts.72.gate_proj", "model.layers.77.mlp.experts.73.gate_proj", "model.layers.77.mlp.experts.74.gate_proj", "model.layers.77.mlp.experts.75.gate_proj", "model.layers.77.mlp.experts.76.gate_proj", "model.layers.77.mlp.experts.77.gate_proj", "model.layers.77.mlp.experts.78.gate_proj", "model.layers.77.mlp.experts.79.gate_proj", "model.layers.77.mlp.experts.80.gate_proj", "model.layers.77.mlp.experts.81.gate_proj", "model.layers.77.mlp.experts.82.gate_proj", "model.layers.77.mlp.experts.83.gate_proj", "model.layers.77.mlp.experts.84.gate_proj", "model.layers.77.mlp.experts.85.gate_proj", "model.layers.77.mlp.experts.86.gate_proj", "model.layers.77.mlp.experts.87.gate_proj", "model.layers.77.mlp.experts.88.gate_proj", "model.layers.77.mlp.experts.89.gate_proj", "model.layers.77.mlp.experts.90.gate_proj", "model.layers.77.mlp.experts.91.gate_proj", "model.layers.77.mlp.experts.92.gate_proj", "model.layers.77.mlp.experts.93.gate_proj", "model.layers.77.mlp.experts.94.gate_proj", "model.layers.77.mlp.experts.95.gate_proj", "model.layers.77.mlp.experts.96.gate_proj", "model.layers.77.mlp.experts.97.gate_proj", "model.layers.77.mlp.experts.98.gate_proj", "model.layers.77.mlp.experts.99.gate_proj", "model.layers.77.mlp.experts.100.gate_proj", "model.layers.77.mlp.experts.101.gate_proj", "model.layers.77.mlp.experts.102.gate_proj", "model.layers.77.mlp.experts.103.gate_proj", "model.layers.77.mlp.experts.104.gate_proj", "model.layers.77.mlp.experts.105.gate_proj", "model.layers.77.mlp.experts.106.gate_proj", "model.layers.77.mlp.experts.107.gate_proj", "model.layers.77.mlp.experts.108.gate_proj", "model.layers.77.mlp.experts.109.gate_proj", "model.layers.77.mlp.experts.110.gate_proj", "model.layers.77.mlp.experts.111.gate_proj", "model.layers.77.mlp.experts.112.gate_proj", "model.layers.77.mlp.experts.113.gate_proj", "model.layers.77.mlp.experts.114.gate_proj", "model.layers.77.mlp.experts.115.gate_proj", "model.layers.77.mlp.experts.116.gate_proj", "model.layers.77.mlp.experts.117.gate_proj", "model.layers.77.mlp.experts.118.gate_proj", "model.layers.77.mlp.experts.119.gate_proj", "model.layers.77.mlp.experts.120.gate_proj", "model.layers.77.mlp.experts.121.gate_proj", "model.layers.77.mlp.experts.122.gate_proj", "model.layers.77.mlp.experts.123.gate_proj", "model.layers.77.mlp.experts.124.gate_proj", "model.layers.77.mlp.experts.125.gate_proj", "model.layers.77.mlp.experts.126.gate_proj", "model.layers.77.mlp.experts.127.gate_proj", "model.layers.77.mlp.experts.128.gate_proj", "model.layers.77.mlp.experts.129.gate_proj", "model.layers.77.mlp.experts.130.gate_proj", "model.layers.77.mlp.experts.131.gate_proj", "model.layers.77.mlp.experts.132.gate_proj", "model.layers.77.mlp.experts.133.gate_proj", "model.layers.77.mlp.experts.134.gate_proj", "model.layers.77.mlp.experts.135.gate_proj", "model.layers.77.mlp.experts.136.gate_proj", "model.layers.77.mlp.experts.137.gate_proj", "model.layers.77.mlp.experts.138.gate_proj", "model.layers.77.mlp.experts.139.gate_proj", "model.layers.77.mlp.experts.140.gate_proj", "model.layers.77.mlp.experts.141.gate_proj", "model.layers.77.mlp.experts.142.gate_proj", "model.layers.77.mlp.experts.143.gate_proj", "model.layers.77.mlp.experts.144.gate_proj", "model.layers.77.mlp.experts.145.gate_proj", "model.layers.77.mlp.experts.146.gate_proj", "model.layers.77.mlp.experts.147.gate_proj", "model.layers.77.mlp.experts.148.gate_proj", "model.layers.77.mlp.experts.149.gate_proj", "model.layers.77.mlp.experts.150.gate_proj", "model.layers.77.mlp.experts.151.gate_proj", "model.layers.77.mlp.experts.152.gate_proj", "model.layers.77.mlp.experts.153.gate_proj", "model.layers.77.mlp.experts.154.gate_proj", "model.layers.77.mlp.experts.155.gate_proj", "model.layers.77.mlp.experts.156.gate_proj", "model.layers.77.mlp.experts.157.gate_proj", "model.layers.77.mlp.experts.158.gate_proj", "model.layers.77.mlp.experts.159.gate_proj", "model.layers.77.mlp.experts.0.up_proj", "model.layers.77.mlp.experts.1.up_proj", "model.layers.77.mlp.experts.2.up_proj", "model.layers.77.mlp.experts.3.up_proj", "model.layers.77.mlp.experts.4.up_proj", "model.layers.77.mlp.experts.5.up_proj", "model.layers.77.mlp.experts.6.up_proj", "model.layers.77.mlp.experts.7.up_proj", "model.layers.77.mlp.experts.8.up_proj", "model.layers.77.mlp.experts.9.up_proj", "model.layers.77.mlp.experts.10.up_proj", "model.layers.77.mlp.experts.11.up_proj", "model.layers.77.mlp.experts.12.up_proj", "model.layers.77.mlp.experts.13.up_proj", "model.layers.77.mlp.experts.14.up_proj", "model.layers.77.mlp.experts.15.up_proj", "model.layers.77.mlp.experts.16.up_proj", "model.layers.77.mlp.experts.17.up_proj", "model.layers.77.mlp.experts.18.up_proj", "model.layers.77.mlp.experts.19.up_proj", "model.layers.77.mlp.experts.20.up_proj", "model.layers.77.mlp.experts.21.up_proj", "model.layers.77.mlp.experts.22.up_proj", "model.layers.77.mlp.experts.23.up_proj", "model.layers.77.mlp.experts.24.up_proj", "model.layers.77.mlp.experts.25.up_proj", "model.layers.77.mlp.experts.26.up_proj", "model.layers.77.mlp.experts.27.up_proj", "model.layers.77.mlp.experts.28.up_proj", "model.layers.77.mlp.experts.29.up_proj", "model.layers.77.mlp.experts.30.up_proj", "model.layers.77.mlp.experts.31.up_proj", "model.layers.77.mlp.experts.32.up_proj", "model.layers.77.mlp.experts.33.up_proj", "model.layers.77.mlp.experts.34.up_proj", "model.layers.77.mlp.experts.35.up_proj", "model.layers.77.mlp.experts.36.up_proj", "model.layers.77.mlp.experts.37.up_proj", "model.layers.77.mlp.experts.38.up_proj", "model.layers.77.mlp.experts.39.up_proj", "model.layers.77.mlp.experts.40.up_proj", "model.layers.77.mlp.experts.41.up_proj", "model.layers.77.mlp.experts.42.up_proj", "model.layers.77.mlp.experts.43.up_proj", "model.layers.77.mlp.experts.44.up_proj", "model.layers.77.mlp.experts.45.up_proj", "model.layers.77.mlp.experts.46.up_proj", "model.layers.77.mlp.experts.47.up_proj", "model.layers.77.mlp.experts.48.up_proj", "model.layers.77.mlp.experts.49.up_proj", "model.layers.77.mlp.experts.50.up_proj", "model.layers.77.mlp.experts.51.up_proj", "model.layers.77.mlp.experts.52.up_proj", "model.layers.77.mlp.experts.53.up_proj", "model.layers.77.mlp.experts.54.up_proj", "model.layers.77.mlp.experts.55.up_proj", "model.layers.77.mlp.experts.56.up_proj", "model.layers.77.mlp.experts.57.up_proj", "model.layers.77.mlp.experts.58.up_proj", "model.layers.77.mlp.experts.59.up_proj", "model.layers.77.mlp.experts.60.up_proj", "model.layers.77.mlp.experts.61.up_proj", "model.layers.77.mlp.experts.62.up_proj", "model.layers.77.mlp.experts.63.up_proj", "model.layers.77.mlp.experts.64.up_proj", "model.layers.77.mlp.experts.65.up_proj", "model.layers.77.mlp.experts.66.up_proj", "model.layers.77.mlp.experts.67.up_proj", "model.layers.77.mlp.experts.68.up_proj", "model.layers.77.mlp.experts.69.up_proj", "model.layers.77.mlp.experts.70.up_proj", "model.layers.77.mlp.experts.71.up_proj", "model.layers.77.mlp.experts.72.up_proj", "model.layers.77.mlp.experts.73.up_proj", "model.layers.77.mlp.experts.74.up_proj", "model.layers.77.mlp.experts.75.up_proj", "model.layers.77.mlp.experts.76.up_proj", "model.layers.77.mlp.experts.77.up_proj", "model.layers.77.mlp.experts.78.up_proj", "model.layers.77.mlp.experts.79.up_proj", "model.layers.77.mlp.experts.80.up_proj", "model.layers.77.mlp.experts.81.up_proj", "model.layers.77.mlp.experts.82.up_proj", "model.layers.77.mlp.experts.83.up_proj", "model.layers.77.mlp.experts.84.up_proj", "model.layers.77.mlp.experts.85.up_proj", "model.layers.77.mlp.experts.86.up_proj", "model.layers.77.mlp.experts.87.up_proj", "model.layers.77.mlp.experts.88.up_proj", "model.layers.77.mlp.experts.89.up_proj", "model.layers.77.mlp.experts.90.up_proj", "model.layers.77.mlp.experts.91.up_proj", "model.layers.77.mlp.experts.92.up_proj", "model.layers.77.mlp.experts.93.up_proj", "model.layers.77.mlp.experts.94.up_proj", "model.layers.77.mlp.experts.95.up_proj", "model.layers.77.mlp.experts.96.up_proj", "model.layers.77.mlp.experts.97.up_proj", "model.layers.77.mlp.experts.98.up_proj", "model.layers.77.mlp.experts.99.up_proj", "model.layers.77.mlp.experts.100.up_proj", "model.layers.77.mlp.experts.101.up_proj", "model.layers.77.mlp.experts.102.up_proj", "model.layers.77.mlp.experts.103.up_proj", "model.layers.77.mlp.experts.104.up_proj", "model.layers.77.mlp.experts.105.up_proj", "model.layers.77.mlp.experts.106.up_proj", "model.layers.77.mlp.experts.107.up_proj", "model.layers.77.mlp.experts.108.up_proj", "model.layers.77.mlp.experts.109.up_proj", "model.layers.77.mlp.experts.110.up_proj", "model.layers.77.mlp.experts.111.up_proj", "model.layers.77.mlp.experts.112.up_proj", "model.layers.77.mlp.experts.113.up_proj", "model.layers.77.mlp.experts.114.up_proj", "model.layers.77.mlp.experts.115.up_proj", "model.layers.77.mlp.experts.116.up_proj", "model.layers.77.mlp.experts.117.up_proj", "model.layers.77.mlp.experts.118.up_proj", "model.layers.77.mlp.experts.119.up_proj", "model.layers.77.mlp.experts.120.up_proj", "model.layers.77.mlp.experts.121.up_proj", "model.layers.77.mlp.experts.122.up_proj", "model.layers.77.mlp.experts.123.up_proj", "model.layers.77.mlp.experts.124.up_proj", "model.layers.77.mlp.experts.125.up_proj", "model.layers.77.mlp.experts.126.up_proj", "model.layers.77.mlp.experts.127.up_proj", "model.layers.77.mlp.experts.128.up_proj", "model.layers.77.mlp.experts.129.up_proj", "model.layers.77.mlp.experts.130.up_proj", "model.layers.77.mlp.experts.131.up_proj", "model.layers.77.mlp.experts.132.up_proj", "model.layers.77.mlp.experts.133.up_proj", "model.layers.77.mlp.experts.134.up_proj", "model.layers.77.mlp.experts.135.up_proj", "model.layers.77.mlp.experts.136.up_proj", "model.layers.77.mlp.experts.137.up_proj", "model.layers.77.mlp.experts.138.up_proj", "model.layers.77.mlp.experts.139.up_proj", "model.layers.77.mlp.experts.140.up_proj", "model.layers.77.mlp.experts.141.up_proj", "model.layers.77.mlp.experts.142.up_proj", "model.layers.77.mlp.experts.143.up_proj", "model.layers.77.mlp.experts.144.up_proj", "model.layers.77.mlp.experts.145.up_proj", "model.layers.77.mlp.experts.146.up_proj", "model.layers.77.mlp.experts.147.up_proj", "model.layers.77.mlp.experts.148.up_proj", "model.layers.77.mlp.experts.149.up_proj", "model.layers.77.mlp.experts.150.up_proj", "model.layers.77.mlp.experts.151.up_proj", "model.layers.77.mlp.experts.152.up_proj", "model.layers.77.mlp.experts.153.up_proj", "model.layers.77.mlp.experts.154.up_proj", "model.layers.77.mlp.experts.155.up_proj", "model.layers.77.mlp.experts.156.up_proj", "model.layers.77.mlp.experts.157.up_proj", "model.layers.77.mlp.experts.158.up_proj", "model.layers.77.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -5.8771809563033794e-06, "dbits": 2516582400 }, { "dkld": -6.166752427802513e-07, "dbits": 5033164800 } ] }, { "idx": 464, "layers": [ "model.layers.77.mlp.experts.0.down_proj", "model.layers.77.mlp.experts.1.down_proj", "model.layers.77.mlp.experts.2.down_proj", "model.layers.77.mlp.experts.3.down_proj", "model.layers.77.mlp.experts.4.down_proj", "model.layers.77.mlp.experts.5.down_proj", "model.layers.77.mlp.experts.6.down_proj", "model.layers.77.mlp.experts.7.down_proj", "model.layers.77.mlp.experts.8.down_proj", "model.layers.77.mlp.experts.9.down_proj", "model.layers.77.mlp.experts.10.down_proj", "model.layers.77.mlp.experts.11.down_proj", "model.layers.77.mlp.experts.12.down_proj", "model.layers.77.mlp.experts.13.down_proj", "model.layers.77.mlp.experts.14.down_proj", "model.layers.77.mlp.experts.15.down_proj", "model.layers.77.mlp.experts.16.down_proj", "model.layers.77.mlp.experts.17.down_proj", "model.layers.77.mlp.experts.18.down_proj", "model.layers.77.mlp.experts.19.down_proj", "model.layers.77.mlp.experts.20.down_proj", "model.layers.77.mlp.experts.21.down_proj", "model.layers.77.mlp.experts.22.down_proj", "model.layers.77.mlp.experts.23.down_proj", "model.layers.77.mlp.experts.24.down_proj", "model.layers.77.mlp.experts.25.down_proj", "model.layers.77.mlp.experts.26.down_proj", "model.layers.77.mlp.experts.27.down_proj", "model.layers.77.mlp.experts.28.down_proj", "model.layers.77.mlp.experts.29.down_proj", "model.layers.77.mlp.experts.30.down_proj", "model.layers.77.mlp.experts.31.down_proj", "model.layers.77.mlp.experts.32.down_proj", "model.layers.77.mlp.experts.33.down_proj", "model.layers.77.mlp.experts.34.down_proj", "model.layers.77.mlp.experts.35.down_proj", "model.layers.77.mlp.experts.36.down_proj", "model.layers.77.mlp.experts.37.down_proj", "model.layers.77.mlp.experts.38.down_proj", "model.layers.77.mlp.experts.39.down_proj", "model.layers.77.mlp.experts.40.down_proj", "model.layers.77.mlp.experts.41.down_proj", "model.layers.77.mlp.experts.42.down_proj", "model.layers.77.mlp.experts.43.down_proj", "model.layers.77.mlp.experts.44.down_proj", "model.layers.77.mlp.experts.45.down_proj", "model.layers.77.mlp.experts.46.down_proj", "model.layers.77.mlp.experts.47.down_proj", "model.layers.77.mlp.experts.48.down_proj", "model.layers.77.mlp.experts.49.down_proj", "model.layers.77.mlp.experts.50.down_proj", "model.layers.77.mlp.experts.51.down_proj", "model.layers.77.mlp.experts.52.down_proj", "model.layers.77.mlp.experts.53.down_proj", "model.layers.77.mlp.experts.54.down_proj", "model.layers.77.mlp.experts.55.down_proj", "model.layers.77.mlp.experts.56.down_proj", "model.layers.77.mlp.experts.57.down_proj", "model.layers.77.mlp.experts.58.down_proj", "model.layers.77.mlp.experts.59.down_proj", "model.layers.77.mlp.experts.60.down_proj", "model.layers.77.mlp.experts.61.down_proj", "model.layers.77.mlp.experts.62.down_proj", "model.layers.77.mlp.experts.63.down_proj", "model.layers.77.mlp.experts.64.down_proj", "model.layers.77.mlp.experts.65.down_proj", "model.layers.77.mlp.experts.66.down_proj", "model.layers.77.mlp.experts.67.down_proj", "model.layers.77.mlp.experts.68.down_proj", "model.layers.77.mlp.experts.69.down_proj", "model.layers.77.mlp.experts.70.down_proj", "model.layers.77.mlp.experts.71.down_proj", "model.layers.77.mlp.experts.72.down_proj", "model.layers.77.mlp.experts.73.down_proj", "model.layers.77.mlp.experts.74.down_proj", "model.layers.77.mlp.experts.75.down_proj", "model.layers.77.mlp.experts.76.down_proj", "model.layers.77.mlp.experts.77.down_proj", "model.layers.77.mlp.experts.78.down_proj", "model.layers.77.mlp.experts.79.down_proj", "model.layers.77.mlp.experts.80.down_proj", "model.layers.77.mlp.experts.81.down_proj", "model.layers.77.mlp.experts.82.down_proj", "model.layers.77.mlp.experts.83.down_proj", "model.layers.77.mlp.experts.84.down_proj", "model.layers.77.mlp.experts.85.down_proj", "model.layers.77.mlp.experts.86.down_proj", "model.layers.77.mlp.experts.87.down_proj", "model.layers.77.mlp.experts.88.down_proj", "model.layers.77.mlp.experts.89.down_proj", "model.layers.77.mlp.experts.90.down_proj", "model.layers.77.mlp.experts.91.down_proj", "model.layers.77.mlp.experts.92.down_proj", "model.layers.77.mlp.experts.93.down_proj", "model.layers.77.mlp.experts.94.down_proj", "model.layers.77.mlp.experts.95.down_proj", "model.layers.77.mlp.experts.96.down_proj", "model.layers.77.mlp.experts.97.down_proj", "model.layers.77.mlp.experts.98.down_proj", "model.layers.77.mlp.experts.99.down_proj", "model.layers.77.mlp.experts.100.down_proj", "model.layers.77.mlp.experts.101.down_proj", "model.layers.77.mlp.experts.102.down_proj", "model.layers.77.mlp.experts.103.down_proj", "model.layers.77.mlp.experts.104.down_proj", "model.layers.77.mlp.experts.105.down_proj", "model.layers.77.mlp.experts.106.down_proj", "model.layers.77.mlp.experts.107.down_proj", "model.layers.77.mlp.experts.108.down_proj", "model.layers.77.mlp.experts.109.down_proj", "model.layers.77.mlp.experts.110.down_proj", "model.layers.77.mlp.experts.111.down_proj", "model.layers.77.mlp.experts.112.down_proj", "model.layers.77.mlp.experts.113.down_proj", "model.layers.77.mlp.experts.114.down_proj", "model.layers.77.mlp.experts.115.down_proj", "model.layers.77.mlp.experts.116.down_proj", "model.layers.77.mlp.experts.117.down_proj", "model.layers.77.mlp.experts.118.down_proj", "model.layers.77.mlp.experts.119.down_proj", "model.layers.77.mlp.experts.120.down_proj", "model.layers.77.mlp.experts.121.down_proj", "model.layers.77.mlp.experts.122.down_proj", "model.layers.77.mlp.experts.123.down_proj", "model.layers.77.mlp.experts.124.down_proj", "model.layers.77.mlp.experts.125.down_proj", "model.layers.77.mlp.experts.126.down_proj", "model.layers.77.mlp.experts.127.down_proj", "model.layers.77.mlp.experts.128.down_proj", "model.layers.77.mlp.experts.129.down_proj", "model.layers.77.mlp.experts.130.down_proj", "model.layers.77.mlp.experts.131.down_proj", "model.layers.77.mlp.experts.132.down_proj", "model.layers.77.mlp.experts.133.down_proj", "model.layers.77.mlp.experts.134.down_proj", "model.layers.77.mlp.experts.135.down_proj", "model.layers.77.mlp.experts.136.down_proj", "model.layers.77.mlp.experts.137.down_proj", "model.layers.77.mlp.experts.138.down_proj", "model.layers.77.mlp.experts.139.down_proj", "model.layers.77.mlp.experts.140.down_proj", "model.layers.77.mlp.experts.141.down_proj", "model.layers.77.mlp.experts.142.down_proj", "model.layers.77.mlp.experts.143.down_proj", "model.layers.77.mlp.experts.144.down_proj", "model.layers.77.mlp.experts.145.down_proj", "model.layers.77.mlp.experts.146.down_proj", "model.layers.77.mlp.experts.147.down_proj", "model.layers.77.mlp.experts.148.down_proj", "model.layers.77.mlp.experts.149.down_proj", "model.layers.77.mlp.experts.150.down_proj", "model.layers.77.mlp.experts.151.down_proj", "model.layers.77.mlp.experts.152.down_proj", "model.layers.77.mlp.experts.153.down_proj", "model.layers.77.mlp.experts.154.down_proj", "model.layers.77.mlp.experts.155.down_proj", "model.layers.77.mlp.experts.156.down_proj", "model.layers.77.mlp.experts.157.down_proj", "model.layers.77.mlp.experts.158.down_proj", "model.layers.77.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 8.5335224866874e-06, "dbits": 1258291200 }, { "dkld": -6.334623321890831e-06, "dbits": 2516582400 } ] }, { "idx": 465, "layers": [ "model.layers.78.self_attn.q_proj" ], "candidates": [ { "dkld": 1.4277873560786247e-05, "dbits": 62914560 }, { "dkld": 1.8496788106859077e-05, "dbits": 125829120 } ] }, { "idx": 466, "layers": [ "model.layers.78.self_attn.k_proj", "model.layers.78.self_attn.v_proj" ], "candidates": [ { "dkld": 4.72350511700019e-06, "dbits": 10485760 }, { "dkld": -2.2168597206473004e-05, "dbits": 20971520 } ] }, { "idx": 467, "layers": [ "model.layers.78.self_attn.o_proj" ], "candidates": [ { "dkld": 2.0271330140531757e-05, "dbits": 62914560 }, { "dkld": 3.9752735756338337e-05, "dbits": 125829120 } ] }, { "idx": 468, "layers": [ "model.layers.78.mlp.shared_experts.gate_proj", "model.layers.78.mlp.shared_experts.up_proj", "model.layers.78.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 6.5839383751164354e-06, "dbits": 23592960 }, { "dkld": 3.7230760790409045e-05, "dbits": 47185920 } ] }, { "idx": 469, "layers": [ "model.layers.78.mlp.experts.0.gate_proj", "model.layers.78.mlp.experts.1.gate_proj", "model.layers.78.mlp.experts.2.gate_proj", "model.layers.78.mlp.experts.3.gate_proj", "model.layers.78.mlp.experts.4.gate_proj", "model.layers.78.mlp.experts.5.gate_proj", "model.layers.78.mlp.experts.6.gate_proj", "model.layers.78.mlp.experts.7.gate_proj", "model.layers.78.mlp.experts.8.gate_proj", "model.layers.78.mlp.experts.9.gate_proj", "model.layers.78.mlp.experts.10.gate_proj", "model.layers.78.mlp.experts.11.gate_proj", "model.layers.78.mlp.experts.12.gate_proj", "model.layers.78.mlp.experts.13.gate_proj", "model.layers.78.mlp.experts.14.gate_proj", "model.layers.78.mlp.experts.15.gate_proj", "model.layers.78.mlp.experts.16.gate_proj", "model.layers.78.mlp.experts.17.gate_proj", "model.layers.78.mlp.experts.18.gate_proj", "model.layers.78.mlp.experts.19.gate_proj", "model.layers.78.mlp.experts.20.gate_proj", "model.layers.78.mlp.experts.21.gate_proj", "model.layers.78.mlp.experts.22.gate_proj", "model.layers.78.mlp.experts.23.gate_proj", "model.layers.78.mlp.experts.24.gate_proj", "model.layers.78.mlp.experts.25.gate_proj", "model.layers.78.mlp.experts.26.gate_proj", "model.layers.78.mlp.experts.27.gate_proj", "model.layers.78.mlp.experts.28.gate_proj", "model.layers.78.mlp.experts.29.gate_proj", "model.layers.78.mlp.experts.30.gate_proj", "model.layers.78.mlp.experts.31.gate_proj", "model.layers.78.mlp.experts.32.gate_proj", "model.layers.78.mlp.experts.33.gate_proj", "model.layers.78.mlp.experts.34.gate_proj", "model.layers.78.mlp.experts.35.gate_proj", "model.layers.78.mlp.experts.36.gate_proj", "model.layers.78.mlp.experts.37.gate_proj", "model.layers.78.mlp.experts.38.gate_proj", "model.layers.78.mlp.experts.39.gate_proj", "model.layers.78.mlp.experts.40.gate_proj", "model.layers.78.mlp.experts.41.gate_proj", "model.layers.78.mlp.experts.42.gate_proj", "model.layers.78.mlp.experts.43.gate_proj", "model.layers.78.mlp.experts.44.gate_proj", "model.layers.78.mlp.experts.45.gate_proj", "model.layers.78.mlp.experts.46.gate_proj", "model.layers.78.mlp.experts.47.gate_proj", "model.layers.78.mlp.experts.48.gate_proj", "model.layers.78.mlp.experts.49.gate_proj", "model.layers.78.mlp.experts.50.gate_proj", "model.layers.78.mlp.experts.51.gate_proj", "model.layers.78.mlp.experts.52.gate_proj", "model.layers.78.mlp.experts.53.gate_proj", "model.layers.78.mlp.experts.54.gate_proj", "model.layers.78.mlp.experts.55.gate_proj", "model.layers.78.mlp.experts.56.gate_proj", "model.layers.78.mlp.experts.57.gate_proj", "model.layers.78.mlp.experts.58.gate_proj", "model.layers.78.mlp.experts.59.gate_proj", "model.layers.78.mlp.experts.60.gate_proj", "model.layers.78.mlp.experts.61.gate_proj", "model.layers.78.mlp.experts.62.gate_proj", "model.layers.78.mlp.experts.63.gate_proj", "model.layers.78.mlp.experts.64.gate_proj", "model.layers.78.mlp.experts.65.gate_proj", "model.layers.78.mlp.experts.66.gate_proj", "model.layers.78.mlp.experts.67.gate_proj", "model.layers.78.mlp.experts.68.gate_proj", "model.layers.78.mlp.experts.69.gate_proj", "model.layers.78.mlp.experts.70.gate_proj", "model.layers.78.mlp.experts.71.gate_proj", "model.layers.78.mlp.experts.72.gate_proj", "model.layers.78.mlp.experts.73.gate_proj", "model.layers.78.mlp.experts.74.gate_proj", "model.layers.78.mlp.experts.75.gate_proj", "model.layers.78.mlp.experts.76.gate_proj", "model.layers.78.mlp.experts.77.gate_proj", "model.layers.78.mlp.experts.78.gate_proj", "model.layers.78.mlp.experts.79.gate_proj", "model.layers.78.mlp.experts.80.gate_proj", "model.layers.78.mlp.experts.81.gate_proj", "model.layers.78.mlp.experts.82.gate_proj", "model.layers.78.mlp.experts.83.gate_proj", "model.layers.78.mlp.experts.84.gate_proj", "model.layers.78.mlp.experts.85.gate_proj", "model.layers.78.mlp.experts.86.gate_proj", "model.layers.78.mlp.experts.87.gate_proj", "model.layers.78.mlp.experts.88.gate_proj", "model.layers.78.mlp.experts.89.gate_proj", "model.layers.78.mlp.experts.90.gate_proj", "model.layers.78.mlp.experts.91.gate_proj", "model.layers.78.mlp.experts.92.gate_proj", "model.layers.78.mlp.experts.93.gate_proj", "model.layers.78.mlp.experts.94.gate_proj", "model.layers.78.mlp.experts.95.gate_proj", "model.layers.78.mlp.experts.96.gate_proj", "model.layers.78.mlp.experts.97.gate_proj", "model.layers.78.mlp.experts.98.gate_proj", "model.layers.78.mlp.experts.99.gate_proj", "model.layers.78.mlp.experts.100.gate_proj", "model.layers.78.mlp.experts.101.gate_proj", "model.layers.78.mlp.experts.102.gate_proj", "model.layers.78.mlp.experts.103.gate_proj", "model.layers.78.mlp.experts.104.gate_proj", "model.layers.78.mlp.experts.105.gate_proj", "model.layers.78.mlp.experts.106.gate_proj", "model.layers.78.mlp.experts.107.gate_proj", "model.layers.78.mlp.experts.108.gate_proj", "model.layers.78.mlp.experts.109.gate_proj", "model.layers.78.mlp.experts.110.gate_proj", "model.layers.78.mlp.experts.111.gate_proj", "model.layers.78.mlp.experts.112.gate_proj", "model.layers.78.mlp.experts.113.gate_proj", "model.layers.78.mlp.experts.114.gate_proj", "model.layers.78.mlp.experts.115.gate_proj", "model.layers.78.mlp.experts.116.gate_proj", "model.layers.78.mlp.experts.117.gate_proj", "model.layers.78.mlp.experts.118.gate_proj", "model.layers.78.mlp.experts.119.gate_proj", "model.layers.78.mlp.experts.120.gate_proj", "model.layers.78.mlp.experts.121.gate_proj", "model.layers.78.mlp.experts.122.gate_proj", "model.layers.78.mlp.experts.123.gate_proj", "model.layers.78.mlp.experts.124.gate_proj", "model.layers.78.mlp.experts.125.gate_proj", "model.layers.78.mlp.experts.126.gate_proj", "model.layers.78.mlp.experts.127.gate_proj", "model.layers.78.mlp.experts.128.gate_proj", "model.layers.78.mlp.experts.129.gate_proj", "model.layers.78.mlp.experts.130.gate_proj", "model.layers.78.mlp.experts.131.gate_proj", "model.layers.78.mlp.experts.132.gate_proj", "model.layers.78.mlp.experts.133.gate_proj", "model.layers.78.mlp.experts.134.gate_proj", "model.layers.78.mlp.experts.135.gate_proj", "model.layers.78.mlp.experts.136.gate_proj", "model.layers.78.mlp.experts.137.gate_proj", "model.layers.78.mlp.experts.138.gate_proj", "model.layers.78.mlp.experts.139.gate_proj", "model.layers.78.mlp.experts.140.gate_proj", "model.layers.78.mlp.experts.141.gate_proj", "model.layers.78.mlp.experts.142.gate_proj", "model.layers.78.mlp.experts.143.gate_proj", "model.layers.78.mlp.experts.144.gate_proj", "model.layers.78.mlp.experts.145.gate_proj", "model.layers.78.mlp.experts.146.gate_proj", "model.layers.78.mlp.experts.147.gate_proj", "model.layers.78.mlp.experts.148.gate_proj", "model.layers.78.mlp.experts.149.gate_proj", "model.layers.78.mlp.experts.150.gate_proj", "model.layers.78.mlp.experts.151.gate_proj", "model.layers.78.mlp.experts.152.gate_proj", "model.layers.78.mlp.experts.153.gate_proj", "model.layers.78.mlp.experts.154.gate_proj", "model.layers.78.mlp.experts.155.gate_proj", "model.layers.78.mlp.experts.156.gate_proj", "model.layers.78.mlp.experts.157.gate_proj", "model.layers.78.mlp.experts.158.gate_proj", "model.layers.78.mlp.experts.159.gate_proj", "model.layers.78.mlp.experts.0.up_proj", "model.layers.78.mlp.experts.1.up_proj", "model.layers.78.mlp.experts.2.up_proj", "model.layers.78.mlp.experts.3.up_proj", "model.layers.78.mlp.experts.4.up_proj", "model.layers.78.mlp.experts.5.up_proj", "model.layers.78.mlp.experts.6.up_proj", "model.layers.78.mlp.experts.7.up_proj", "model.layers.78.mlp.experts.8.up_proj", "model.layers.78.mlp.experts.9.up_proj", "model.layers.78.mlp.experts.10.up_proj", "model.layers.78.mlp.experts.11.up_proj", "model.layers.78.mlp.experts.12.up_proj", "model.layers.78.mlp.experts.13.up_proj", "model.layers.78.mlp.experts.14.up_proj", "model.layers.78.mlp.experts.15.up_proj", "model.layers.78.mlp.experts.16.up_proj", "model.layers.78.mlp.experts.17.up_proj", "model.layers.78.mlp.experts.18.up_proj", "model.layers.78.mlp.experts.19.up_proj", "model.layers.78.mlp.experts.20.up_proj", "model.layers.78.mlp.experts.21.up_proj", "model.layers.78.mlp.experts.22.up_proj", "model.layers.78.mlp.experts.23.up_proj", "model.layers.78.mlp.experts.24.up_proj", "model.layers.78.mlp.experts.25.up_proj", "model.layers.78.mlp.experts.26.up_proj", "model.layers.78.mlp.experts.27.up_proj", "model.layers.78.mlp.experts.28.up_proj", "model.layers.78.mlp.experts.29.up_proj", "model.layers.78.mlp.experts.30.up_proj", "model.layers.78.mlp.experts.31.up_proj", "model.layers.78.mlp.experts.32.up_proj", "model.layers.78.mlp.experts.33.up_proj", "model.layers.78.mlp.experts.34.up_proj", "model.layers.78.mlp.experts.35.up_proj", "model.layers.78.mlp.experts.36.up_proj", "model.layers.78.mlp.experts.37.up_proj", "model.layers.78.mlp.experts.38.up_proj", "model.layers.78.mlp.experts.39.up_proj", "model.layers.78.mlp.experts.40.up_proj", "model.layers.78.mlp.experts.41.up_proj", "model.layers.78.mlp.experts.42.up_proj", "model.layers.78.mlp.experts.43.up_proj", "model.layers.78.mlp.experts.44.up_proj", "model.layers.78.mlp.experts.45.up_proj", "model.layers.78.mlp.experts.46.up_proj", "model.layers.78.mlp.experts.47.up_proj", "model.layers.78.mlp.experts.48.up_proj", "model.layers.78.mlp.experts.49.up_proj", "model.layers.78.mlp.experts.50.up_proj", "model.layers.78.mlp.experts.51.up_proj", "model.layers.78.mlp.experts.52.up_proj", "model.layers.78.mlp.experts.53.up_proj", "model.layers.78.mlp.experts.54.up_proj", "model.layers.78.mlp.experts.55.up_proj", "model.layers.78.mlp.experts.56.up_proj", "model.layers.78.mlp.experts.57.up_proj", "model.layers.78.mlp.experts.58.up_proj", "model.layers.78.mlp.experts.59.up_proj", "model.layers.78.mlp.experts.60.up_proj", "model.layers.78.mlp.experts.61.up_proj", "model.layers.78.mlp.experts.62.up_proj", "model.layers.78.mlp.experts.63.up_proj", "model.layers.78.mlp.experts.64.up_proj", "model.layers.78.mlp.experts.65.up_proj", "model.layers.78.mlp.experts.66.up_proj", "model.layers.78.mlp.experts.67.up_proj", "model.layers.78.mlp.experts.68.up_proj", "model.layers.78.mlp.experts.69.up_proj", "model.layers.78.mlp.experts.70.up_proj", "model.layers.78.mlp.experts.71.up_proj", "model.layers.78.mlp.experts.72.up_proj", "model.layers.78.mlp.experts.73.up_proj", "model.layers.78.mlp.experts.74.up_proj", "model.layers.78.mlp.experts.75.up_proj", "model.layers.78.mlp.experts.76.up_proj", "model.layers.78.mlp.experts.77.up_proj", "model.layers.78.mlp.experts.78.up_proj", "model.layers.78.mlp.experts.79.up_proj", "model.layers.78.mlp.experts.80.up_proj", "model.layers.78.mlp.experts.81.up_proj", "model.layers.78.mlp.experts.82.up_proj", "model.layers.78.mlp.experts.83.up_proj", "model.layers.78.mlp.experts.84.up_proj", "model.layers.78.mlp.experts.85.up_proj", "model.layers.78.mlp.experts.86.up_proj", "model.layers.78.mlp.experts.87.up_proj", "model.layers.78.mlp.experts.88.up_proj", "model.layers.78.mlp.experts.89.up_proj", "model.layers.78.mlp.experts.90.up_proj", "model.layers.78.mlp.experts.91.up_proj", "model.layers.78.mlp.experts.92.up_proj", "model.layers.78.mlp.experts.93.up_proj", "model.layers.78.mlp.experts.94.up_proj", "model.layers.78.mlp.experts.95.up_proj", "model.layers.78.mlp.experts.96.up_proj", "model.layers.78.mlp.experts.97.up_proj", "model.layers.78.mlp.experts.98.up_proj", "model.layers.78.mlp.experts.99.up_proj", "model.layers.78.mlp.experts.100.up_proj", "model.layers.78.mlp.experts.101.up_proj", "model.layers.78.mlp.experts.102.up_proj", "model.layers.78.mlp.experts.103.up_proj", "model.layers.78.mlp.experts.104.up_proj", "model.layers.78.mlp.experts.105.up_proj", "model.layers.78.mlp.experts.106.up_proj", "model.layers.78.mlp.experts.107.up_proj", "model.layers.78.mlp.experts.108.up_proj", "model.layers.78.mlp.experts.109.up_proj", "model.layers.78.mlp.experts.110.up_proj", "model.layers.78.mlp.experts.111.up_proj", "model.layers.78.mlp.experts.112.up_proj", "model.layers.78.mlp.experts.113.up_proj", "model.layers.78.mlp.experts.114.up_proj", "model.layers.78.mlp.experts.115.up_proj", "model.layers.78.mlp.experts.116.up_proj", "model.layers.78.mlp.experts.117.up_proj", "model.layers.78.mlp.experts.118.up_proj", "model.layers.78.mlp.experts.119.up_proj", "model.layers.78.mlp.experts.120.up_proj", "model.layers.78.mlp.experts.121.up_proj", "model.layers.78.mlp.experts.122.up_proj", "model.layers.78.mlp.experts.123.up_proj", "model.layers.78.mlp.experts.124.up_proj", "model.layers.78.mlp.experts.125.up_proj", "model.layers.78.mlp.experts.126.up_proj", "model.layers.78.mlp.experts.127.up_proj", "model.layers.78.mlp.experts.128.up_proj", "model.layers.78.mlp.experts.129.up_proj", "model.layers.78.mlp.experts.130.up_proj", "model.layers.78.mlp.experts.131.up_proj", "model.layers.78.mlp.experts.132.up_proj", "model.layers.78.mlp.experts.133.up_proj", "model.layers.78.mlp.experts.134.up_proj", "model.layers.78.mlp.experts.135.up_proj", "model.layers.78.mlp.experts.136.up_proj", "model.layers.78.mlp.experts.137.up_proj", "model.layers.78.mlp.experts.138.up_proj", "model.layers.78.mlp.experts.139.up_proj", "model.layers.78.mlp.experts.140.up_proj", "model.layers.78.mlp.experts.141.up_proj", "model.layers.78.mlp.experts.142.up_proj", "model.layers.78.mlp.experts.143.up_proj", "model.layers.78.mlp.experts.144.up_proj", "model.layers.78.mlp.experts.145.up_proj", "model.layers.78.mlp.experts.146.up_proj", "model.layers.78.mlp.experts.147.up_proj", "model.layers.78.mlp.experts.148.up_proj", "model.layers.78.mlp.experts.149.up_proj", "model.layers.78.mlp.experts.150.up_proj", "model.layers.78.mlp.experts.151.up_proj", "model.layers.78.mlp.experts.152.up_proj", "model.layers.78.mlp.experts.153.up_proj", "model.layers.78.mlp.experts.154.up_proj", "model.layers.78.mlp.experts.155.up_proj", "model.layers.78.mlp.experts.156.up_proj", "model.layers.78.mlp.experts.157.up_proj", "model.layers.78.mlp.experts.158.up_proj", "model.layers.78.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 7.679546251894431e-06, "dbits": 2516582400 }, { "dkld": 4.8481160774827e-06, "dbits": 5033164800 } ] }, { "idx": 470, "layers": [ "model.layers.78.mlp.experts.0.down_proj", "model.layers.78.mlp.experts.1.down_proj", "model.layers.78.mlp.experts.2.down_proj", "model.layers.78.mlp.experts.3.down_proj", "model.layers.78.mlp.experts.4.down_proj", "model.layers.78.mlp.experts.5.down_proj", "model.layers.78.mlp.experts.6.down_proj", "model.layers.78.mlp.experts.7.down_proj", "model.layers.78.mlp.experts.8.down_proj", "model.layers.78.mlp.experts.9.down_proj", "model.layers.78.mlp.experts.10.down_proj", "model.layers.78.mlp.experts.11.down_proj", "model.layers.78.mlp.experts.12.down_proj", "model.layers.78.mlp.experts.13.down_proj", "model.layers.78.mlp.experts.14.down_proj", "model.layers.78.mlp.experts.15.down_proj", "model.layers.78.mlp.experts.16.down_proj", "model.layers.78.mlp.experts.17.down_proj", "model.layers.78.mlp.experts.18.down_proj", "model.layers.78.mlp.experts.19.down_proj", "model.layers.78.mlp.experts.20.down_proj", "model.layers.78.mlp.experts.21.down_proj", "model.layers.78.mlp.experts.22.down_proj", "model.layers.78.mlp.experts.23.down_proj", "model.layers.78.mlp.experts.24.down_proj", "model.layers.78.mlp.experts.25.down_proj", "model.layers.78.mlp.experts.26.down_proj", "model.layers.78.mlp.experts.27.down_proj", "model.layers.78.mlp.experts.28.down_proj", "model.layers.78.mlp.experts.29.down_proj", "model.layers.78.mlp.experts.30.down_proj", "model.layers.78.mlp.experts.31.down_proj", "model.layers.78.mlp.experts.32.down_proj", "model.layers.78.mlp.experts.33.down_proj", "model.layers.78.mlp.experts.34.down_proj", "model.layers.78.mlp.experts.35.down_proj", "model.layers.78.mlp.experts.36.down_proj", "model.layers.78.mlp.experts.37.down_proj", "model.layers.78.mlp.experts.38.down_proj", "model.layers.78.mlp.experts.39.down_proj", "model.layers.78.mlp.experts.40.down_proj", "model.layers.78.mlp.experts.41.down_proj", "model.layers.78.mlp.experts.42.down_proj", "model.layers.78.mlp.experts.43.down_proj", "model.layers.78.mlp.experts.44.down_proj", "model.layers.78.mlp.experts.45.down_proj", "model.layers.78.mlp.experts.46.down_proj", "model.layers.78.mlp.experts.47.down_proj", "model.layers.78.mlp.experts.48.down_proj", "model.layers.78.mlp.experts.49.down_proj", "model.layers.78.mlp.experts.50.down_proj", "model.layers.78.mlp.experts.51.down_proj", "model.layers.78.mlp.experts.52.down_proj", "model.layers.78.mlp.experts.53.down_proj", "model.layers.78.mlp.experts.54.down_proj", "model.layers.78.mlp.experts.55.down_proj", "model.layers.78.mlp.experts.56.down_proj", "model.layers.78.mlp.experts.57.down_proj", "model.layers.78.mlp.experts.58.down_proj", "model.layers.78.mlp.experts.59.down_proj", "model.layers.78.mlp.experts.60.down_proj", "model.layers.78.mlp.experts.61.down_proj", "model.layers.78.mlp.experts.62.down_proj", "model.layers.78.mlp.experts.63.down_proj", "model.layers.78.mlp.experts.64.down_proj", "model.layers.78.mlp.experts.65.down_proj", "model.layers.78.mlp.experts.66.down_proj", "model.layers.78.mlp.experts.67.down_proj", "model.layers.78.mlp.experts.68.down_proj", "model.layers.78.mlp.experts.69.down_proj", "model.layers.78.mlp.experts.70.down_proj", "model.layers.78.mlp.experts.71.down_proj", "model.layers.78.mlp.experts.72.down_proj", "model.layers.78.mlp.experts.73.down_proj", "model.layers.78.mlp.experts.74.down_proj", "model.layers.78.mlp.experts.75.down_proj", "model.layers.78.mlp.experts.76.down_proj", "model.layers.78.mlp.experts.77.down_proj", "model.layers.78.mlp.experts.78.down_proj", "model.layers.78.mlp.experts.79.down_proj", "model.layers.78.mlp.experts.80.down_proj", "model.layers.78.mlp.experts.81.down_proj", "model.layers.78.mlp.experts.82.down_proj", "model.layers.78.mlp.experts.83.down_proj", "model.layers.78.mlp.experts.84.down_proj", "model.layers.78.mlp.experts.85.down_proj", "model.layers.78.mlp.experts.86.down_proj", "model.layers.78.mlp.experts.87.down_proj", "model.layers.78.mlp.experts.88.down_proj", "model.layers.78.mlp.experts.89.down_proj", "model.layers.78.mlp.experts.90.down_proj", "model.layers.78.mlp.experts.91.down_proj", "model.layers.78.mlp.experts.92.down_proj", "model.layers.78.mlp.experts.93.down_proj", "model.layers.78.mlp.experts.94.down_proj", "model.layers.78.mlp.experts.95.down_proj", "model.layers.78.mlp.experts.96.down_proj", "model.layers.78.mlp.experts.97.down_proj", "model.layers.78.mlp.experts.98.down_proj", "model.layers.78.mlp.experts.99.down_proj", "model.layers.78.mlp.experts.100.down_proj", "model.layers.78.mlp.experts.101.down_proj", "model.layers.78.mlp.experts.102.down_proj", "model.layers.78.mlp.experts.103.down_proj", "model.layers.78.mlp.experts.104.down_proj", "model.layers.78.mlp.experts.105.down_proj", "model.layers.78.mlp.experts.106.down_proj", "model.layers.78.mlp.experts.107.down_proj", "model.layers.78.mlp.experts.108.down_proj", "model.layers.78.mlp.experts.109.down_proj", "model.layers.78.mlp.experts.110.down_proj", "model.layers.78.mlp.experts.111.down_proj", "model.layers.78.mlp.experts.112.down_proj", "model.layers.78.mlp.experts.113.down_proj", "model.layers.78.mlp.experts.114.down_proj", "model.layers.78.mlp.experts.115.down_proj", "model.layers.78.mlp.experts.116.down_proj", "model.layers.78.mlp.experts.117.down_proj", "model.layers.78.mlp.experts.118.down_proj", "model.layers.78.mlp.experts.119.down_proj", "model.layers.78.mlp.experts.120.down_proj", "model.layers.78.mlp.experts.121.down_proj", "model.layers.78.mlp.experts.122.down_proj", "model.layers.78.mlp.experts.123.down_proj", "model.layers.78.mlp.experts.124.down_proj", "model.layers.78.mlp.experts.125.down_proj", "model.layers.78.mlp.experts.126.down_proj", "model.layers.78.mlp.experts.127.down_proj", "model.layers.78.mlp.experts.128.down_proj", "model.layers.78.mlp.experts.129.down_proj", "model.layers.78.mlp.experts.130.down_proj", "model.layers.78.mlp.experts.131.down_proj", "model.layers.78.mlp.experts.132.down_proj", "model.layers.78.mlp.experts.133.down_proj", "model.layers.78.mlp.experts.134.down_proj", "model.layers.78.mlp.experts.135.down_proj", "model.layers.78.mlp.experts.136.down_proj", "model.layers.78.mlp.experts.137.down_proj", "model.layers.78.mlp.experts.138.down_proj", "model.layers.78.mlp.experts.139.down_proj", "model.layers.78.mlp.experts.140.down_proj", "model.layers.78.mlp.experts.141.down_proj", "model.layers.78.mlp.experts.142.down_proj", "model.layers.78.mlp.experts.143.down_proj", "model.layers.78.mlp.experts.144.down_proj", "model.layers.78.mlp.experts.145.down_proj", "model.layers.78.mlp.experts.146.down_proj", "model.layers.78.mlp.experts.147.down_proj", "model.layers.78.mlp.experts.148.down_proj", "model.layers.78.mlp.experts.149.down_proj", "model.layers.78.mlp.experts.150.down_proj", "model.layers.78.mlp.experts.151.down_proj", "model.layers.78.mlp.experts.152.down_proj", "model.layers.78.mlp.experts.153.down_proj", "model.layers.78.mlp.experts.154.down_proj", "model.layers.78.mlp.experts.155.down_proj", "model.layers.78.mlp.experts.156.down_proj", "model.layers.78.mlp.experts.157.down_proj", "model.layers.78.mlp.experts.158.down_proj", "model.layers.78.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.339761704205426e-06, "dbits": 1258291200 }, { "dkld": -1.785093918442622e-05, "dbits": 2516582400 } ] }, { "idx": 471, "layers": [ "model.layers.79.self_attn.q_proj" ], "candidates": [ { "dkld": 1.9829417578876712e-05, "dbits": 62914560 }, { "dkld": 6.194901652635532e-06, "dbits": 125829120 } ] }, { "idx": 472, "layers": [ "model.layers.79.self_attn.k_proj", "model.layers.79.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0001557020470499982, "dbits": 10485760 }, { "dkld": -0.0001919494476169334, "dbits": 20971520 } ] }, { "idx": 473, "layers": [ "model.layers.79.self_attn.o_proj" ], "candidates": [ { "dkld": -1.9184057600795876e-05, "dbits": 62914560 }, { "dkld": 3.282446414232254e-06, "dbits": 125829120 } ] }, { "idx": 474, "layers": [ "model.layers.79.mlp.shared_experts.gate_proj", "model.layers.79.mlp.shared_experts.up_proj", "model.layers.79.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 3.610968124121566e-05, "dbits": 23592960 }, { "dkld": 2.0053749904037216e-05, "dbits": 47185920 } ] }, { "idx": 475, "layers": [ "model.layers.79.mlp.experts.0.gate_proj", "model.layers.79.mlp.experts.1.gate_proj", "model.layers.79.mlp.experts.2.gate_proj", "model.layers.79.mlp.experts.3.gate_proj", "model.layers.79.mlp.experts.4.gate_proj", "model.layers.79.mlp.experts.5.gate_proj", "model.layers.79.mlp.experts.6.gate_proj", "model.layers.79.mlp.experts.7.gate_proj", "model.layers.79.mlp.experts.8.gate_proj", "model.layers.79.mlp.experts.9.gate_proj", "model.layers.79.mlp.experts.10.gate_proj", "model.layers.79.mlp.experts.11.gate_proj", "model.layers.79.mlp.experts.12.gate_proj", "model.layers.79.mlp.experts.13.gate_proj", "model.layers.79.mlp.experts.14.gate_proj", "model.layers.79.mlp.experts.15.gate_proj", "model.layers.79.mlp.experts.16.gate_proj", "model.layers.79.mlp.experts.17.gate_proj", "model.layers.79.mlp.experts.18.gate_proj", "model.layers.79.mlp.experts.19.gate_proj", "model.layers.79.mlp.experts.20.gate_proj", "model.layers.79.mlp.experts.21.gate_proj", "model.layers.79.mlp.experts.22.gate_proj", "model.layers.79.mlp.experts.23.gate_proj", "model.layers.79.mlp.experts.24.gate_proj", "model.layers.79.mlp.experts.25.gate_proj", "model.layers.79.mlp.experts.26.gate_proj", "model.layers.79.mlp.experts.27.gate_proj", "model.layers.79.mlp.experts.28.gate_proj", "model.layers.79.mlp.experts.29.gate_proj", "model.layers.79.mlp.experts.30.gate_proj", "model.layers.79.mlp.experts.31.gate_proj", "model.layers.79.mlp.experts.32.gate_proj", "model.layers.79.mlp.experts.33.gate_proj", "model.layers.79.mlp.experts.34.gate_proj", "model.layers.79.mlp.experts.35.gate_proj", "model.layers.79.mlp.experts.36.gate_proj", "model.layers.79.mlp.experts.37.gate_proj", "model.layers.79.mlp.experts.38.gate_proj", "model.layers.79.mlp.experts.39.gate_proj", "model.layers.79.mlp.experts.40.gate_proj", "model.layers.79.mlp.experts.41.gate_proj", "model.layers.79.mlp.experts.42.gate_proj", "model.layers.79.mlp.experts.43.gate_proj", "model.layers.79.mlp.experts.44.gate_proj", "model.layers.79.mlp.experts.45.gate_proj", "model.layers.79.mlp.experts.46.gate_proj", "model.layers.79.mlp.experts.47.gate_proj", "model.layers.79.mlp.experts.48.gate_proj", "model.layers.79.mlp.experts.49.gate_proj", "model.layers.79.mlp.experts.50.gate_proj", "model.layers.79.mlp.experts.51.gate_proj", "model.layers.79.mlp.experts.52.gate_proj", "model.layers.79.mlp.experts.53.gate_proj", "model.layers.79.mlp.experts.54.gate_proj", "model.layers.79.mlp.experts.55.gate_proj", "model.layers.79.mlp.experts.56.gate_proj", "model.layers.79.mlp.experts.57.gate_proj", "model.layers.79.mlp.experts.58.gate_proj", "model.layers.79.mlp.experts.59.gate_proj", "model.layers.79.mlp.experts.60.gate_proj", "model.layers.79.mlp.experts.61.gate_proj", "model.layers.79.mlp.experts.62.gate_proj", "model.layers.79.mlp.experts.63.gate_proj", "model.layers.79.mlp.experts.64.gate_proj", "model.layers.79.mlp.experts.65.gate_proj", "model.layers.79.mlp.experts.66.gate_proj", "model.layers.79.mlp.experts.67.gate_proj", "model.layers.79.mlp.experts.68.gate_proj", "model.layers.79.mlp.experts.69.gate_proj", "model.layers.79.mlp.experts.70.gate_proj", "model.layers.79.mlp.experts.71.gate_proj", "model.layers.79.mlp.experts.72.gate_proj", "model.layers.79.mlp.experts.73.gate_proj", "model.layers.79.mlp.experts.74.gate_proj", "model.layers.79.mlp.experts.75.gate_proj", "model.layers.79.mlp.experts.76.gate_proj", "model.layers.79.mlp.experts.77.gate_proj", "model.layers.79.mlp.experts.78.gate_proj", "model.layers.79.mlp.experts.79.gate_proj", "model.layers.79.mlp.experts.80.gate_proj", "model.layers.79.mlp.experts.81.gate_proj", "model.layers.79.mlp.experts.82.gate_proj", "model.layers.79.mlp.experts.83.gate_proj", "model.layers.79.mlp.experts.84.gate_proj", "model.layers.79.mlp.experts.85.gate_proj", "model.layers.79.mlp.experts.86.gate_proj", "model.layers.79.mlp.experts.87.gate_proj", "model.layers.79.mlp.experts.88.gate_proj", "model.layers.79.mlp.experts.89.gate_proj", "model.layers.79.mlp.experts.90.gate_proj", "model.layers.79.mlp.experts.91.gate_proj", "model.layers.79.mlp.experts.92.gate_proj", "model.layers.79.mlp.experts.93.gate_proj", "model.layers.79.mlp.experts.94.gate_proj", "model.layers.79.mlp.experts.95.gate_proj", "model.layers.79.mlp.experts.96.gate_proj", "model.layers.79.mlp.experts.97.gate_proj", "model.layers.79.mlp.experts.98.gate_proj", "model.layers.79.mlp.experts.99.gate_proj", "model.layers.79.mlp.experts.100.gate_proj", "model.layers.79.mlp.experts.101.gate_proj", "model.layers.79.mlp.experts.102.gate_proj", "model.layers.79.mlp.experts.103.gate_proj", "model.layers.79.mlp.experts.104.gate_proj", "model.layers.79.mlp.experts.105.gate_proj", "model.layers.79.mlp.experts.106.gate_proj", "model.layers.79.mlp.experts.107.gate_proj", "model.layers.79.mlp.experts.108.gate_proj", "model.layers.79.mlp.experts.109.gate_proj", "model.layers.79.mlp.experts.110.gate_proj", "model.layers.79.mlp.experts.111.gate_proj", "model.layers.79.mlp.experts.112.gate_proj", "model.layers.79.mlp.experts.113.gate_proj", "model.layers.79.mlp.experts.114.gate_proj", "model.layers.79.mlp.experts.115.gate_proj", "model.layers.79.mlp.experts.116.gate_proj", "model.layers.79.mlp.experts.117.gate_proj", "model.layers.79.mlp.experts.118.gate_proj", "model.layers.79.mlp.experts.119.gate_proj", "model.layers.79.mlp.experts.120.gate_proj", "model.layers.79.mlp.experts.121.gate_proj", "model.layers.79.mlp.experts.122.gate_proj", "model.layers.79.mlp.experts.123.gate_proj", "model.layers.79.mlp.experts.124.gate_proj", "model.layers.79.mlp.experts.125.gate_proj", "model.layers.79.mlp.experts.126.gate_proj", "model.layers.79.mlp.experts.127.gate_proj", "model.layers.79.mlp.experts.128.gate_proj", "model.layers.79.mlp.experts.129.gate_proj", "model.layers.79.mlp.experts.130.gate_proj", "model.layers.79.mlp.experts.131.gate_proj", "model.layers.79.mlp.experts.132.gate_proj", "model.layers.79.mlp.experts.133.gate_proj", "model.layers.79.mlp.experts.134.gate_proj", "model.layers.79.mlp.experts.135.gate_proj", "model.layers.79.mlp.experts.136.gate_proj", "model.layers.79.mlp.experts.137.gate_proj", "model.layers.79.mlp.experts.138.gate_proj", "model.layers.79.mlp.experts.139.gate_proj", "model.layers.79.mlp.experts.140.gate_proj", "model.layers.79.mlp.experts.141.gate_proj", "model.layers.79.mlp.experts.142.gate_proj", "model.layers.79.mlp.experts.143.gate_proj", "model.layers.79.mlp.experts.144.gate_proj", "model.layers.79.mlp.experts.145.gate_proj", "model.layers.79.mlp.experts.146.gate_proj", "model.layers.79.mlp.experts.147.gate_proj", "model.layers.79.mlp.experts.148.gate_proj", "model.layers.79.mlp.experts.149.gate_proj", "model.layers.79.mlp.experts.150.gate_proj", "model.layers.79.mlp.experts.151.gate_proj", "model.layers.79.mlp.experts.152.gate_proj", "model.layers.79.mlp.experts.153.gate_proj", "model.layers.79.mlp.experts.154.gate_proj", "model.layers.79.mlp.experts.155.gate_proj", "model.layers.79.mlp.experts.156.gate_proj", "model.layers.79.mlp.experts.157.gate_proj", "model.layers.79.mlp.experts.158.gate_proj", "model.layers.79.mlp.experts.159.gate_proj", "model.layers.79.mlp.experts.0.up_proj", "model.layers.79.mlp.experts.1.up_proj", "model.layers.79.mlp.experts.2.up_proj", "model.layers.79.mlp.experts.3.up_proj", "model.layers.79.mlp.experts.4.up_proj", "model.layers.79.mlp.experts.5.up_proj", "model.layers.79.mlp.experts.6.up_proj", "model.layers.79.mlp.experts.7.up_proj", "model.layers.79.mlp.experts.8.up_proj", "model.layers.79.mlp.experts.9.up_proj", "model.layers.79.mlp.experts.10.up_proj", "model.layers.79.mlp.experts.11.up_proj", "model.layers.79.mlp.experts.12.up_proj", "model.layers.79.mlp.experts.13.up_proj", "model.layers.79.mlp.experts.14.up_proj", "model.layers.79.mlp.experts.15.up_proj", "model.layers.79.mlp.experts.16.up_proj", "model.layers.79.mlp.experts.17.up_proj", "model.layers.79.mlp.experts.18.up_proj", "model.layers.79.mlp.experts.19.up_proj", "model.layers.79.mlp.experts.20.up_proj", "model.layers.79.mlp.experts.21.up_proj", "model.layers.79.mlp.experts.22.up_proj", "model.layers.79.mlp.experts.23.up_proj", "model.layers.79.mlp.experts.24.up_proj", "model.layers.79.mlp.experts.25.up_proj", "model.layers.79.mlp.experts.26.up_proj", "model.layers.79.mlp.experts.27.up_proj", "model.layers.79.mlp.experts.28.up_proj", "model.layers.79.mlp.experts.29.up_proj", "model.layers.79.mlp.experts.30.up_proj", "model.layers.79.mlp.experts.31.up_proj", "model.layers.79.mlp.experts.32.up_proj", "model.layers.79.mlp.experts.33.up_proj", "model.layers.79.mlp.experts.34.up_proj", "model.layers.79.mlp.experts.35.up_proj", "model.layers.79.mlp.experts.36.up_proj", "model.layers.79.mlp.experts.37.up_proj", "model.layers.79.mlp.experts.38.up_proj", "model.layers.79.mlp.experts.39.up_proj", "model.layers.79.mlp.experts.40.up_proj", "model.layers.79.mlp.experts.41.up_proj", "model.layers.79.mlp.experts.42.up_proj", "model.layers.79.mlp.experts.43.up_proj", "model.layers.79.mlp.experts.44.up_proj", "model.layers.79.mlp.experts.45.up_proj", "model.layers.79.mlp.experts.46.up_proj", "model.layers.79.mlp.experts.47.up_proj", "model.layers.79.mlp.experts.48.up_proj", "model.layers.79.mlp.experts.49.up_proj", "model.layers.79.mlp.experts.50.up_proj", "model.layers.79.mlp.experts.51.up_proj", "model.layers.79.mlp.experts.52.up_proj", "model.layers.79.mlp.experts.53.up_proj", "model.layers.79.mlp.experts.54.up_proj", "model.layers.79.mlp.experts.55.up_proj", "model.layers.79.mlp.experts.56.up_proj", "model.layers.79.mlp.experts.57.up_proj", "model.layers.79.mlp.experts.58.up_proj", "model.layers.79.mlp.experts.59.up_proj", "model.layers.79.mlp.experts.60.up_proj", "model.layers.79.mlp.experts.61.up_proj", "model.layers.79.mlp.experts.62.up_proj", "model.layers.79.mlp.experts.63.up_proj", "model.layers.79.mlp.experts.64.up_proj", "model.layers.79.mlp.experts.65.up_proj", "model.layers.79.mlp.experts.66.up_proj", "model.layers.79.mlp.experts.67.up_proj", "model.layers.79.mlp.experts.68.up_proj", "model.layers.79.mlp.experts.69.up_proj", "model.layers.79.mlp.experts.70.up_proj", "model.layers.79.mlp.experts.71.up_proj", "model.layers.79.mlp.experts.72.up_proj", "model.layers.79.mlp.experts.73.up_proj", "model.layers.79.mlp.experts.74.up_proj", "model.layers.79.mlp.experts.75.up_proj", "model.layers.79.mlp.experts.76.up_proj", "model.layers.79.mlp.experts.77.up_proj", "model.layers.79.mlp.experts.78.up_proj", "model.layers.79.mlp.experts.79.up_proj", "model.layers.79.mlp.experts.80.up_proj", "model.layers.79.mlp.experts.81.up_proj", "model.layers.79.mlp.experts.82.up_proj", "model.layers.79.mlp.experts.83.up_proj", "model.layers.79.mlp.experts.84.up_proj", "model.layers.79.mlp.experts.85.up_proj", "model.layers.79.mlp.experts.86.up_proj", "model.layers.79.mlp.experts.87.up_proj", "model.layers.79.mlp.experts.88.up_proj", "model.layers.79.mlp.experts.89.up_proj", "model.layers.79.mlp.experts.90.up_proj", "model.layers.79.mlp.experts.91.up_proj", "model.layers.79.mlp.experts.92.up_proj", "model.layers.79.mlp.experts.93.up_proj", "model.layers.79.mlp.experts.94.up_proj", "model.layers.79.mlp.experts.95.up_proj", "model.layers.79.mlp.experts.96.up_proj", "model.layers.79.mlp.experts.97.up_proj", "model.layers.79.mlp.experts.98.up_proj", "model.layers.79.mlp.experts.99.up_proj", "model.layers.79.mlp.experts.100.up_proj", "model.layers.79.mlp.experts.101.up_proj", "model.layers.79.mlp.experts.102.up_proj", "model.layers.79.mlp.experts.103.up_proj", "model.layers.79.mlp.experts.104.up_proj", "model.layers.79.mlp.experts.105.up_proj", "model.layers.79.mlp.experts.106.up_proj", "model.layers.79.mlp.experts.107.up_proj", "model.layers.79.mlp.experts.108.up_proj", "model.layers.79.mlp.experts.109.up_proj", "model.layers.79.mlp.experts.110.up_proj", "model.layers.79.mlp.experts.111.up_proj", "model.layers.79.mlp.experts.112.up_proj", "model.layers.79.mlp.experts.113.up_proj", "model.layers.79.mlp.experts.114.up_proj", "model.layers.79.mlp.experts.115.up_proj", "model.layers.79.mlp.experts.116.up_proj", "model.layers.79.mlp.experts.117.up_proj", "model.layers.79.mlp.experts.118.up_proj", "model.layers.79.mlp.experts.119.up_proj", "model.layers.79.mlp.experts.120.up_proj", "model.layers.79.mlp.experts.121.up_proj", "model.layers.79.mlp.experts.122.up_proj", "model.layers.79.mlp.experts.123.up_proj", "model.layers.79.mlp.experts.124.up_proj", "model.layers.79.mlp.experts.125.up_proj", "model.layers.79.mlp.experts.126.up_proj", "model.layers.79.mlp.experts.127.up_proj", "model.layers.79.mlp.experts.128.up_proj", "model.layers.79.mlp.experts.129.up_proj", "model.layers.79.mlp.experts.130.up_proj", "model.layers.79.mlp.experts.131.up_proj", "model.layers.79.mlp.experts.132.up_proj", "model.layers.79.mlp.experts.133.up_proj", "model.layers.79.mlp.experts.134.up_proj", "model.layers.79.mlp.experts.135.up_proj", "model.layers.79.mlp.experts.136.up_proj", "model.layers.79.mlp.experts.137.up_proj", "model.layers.79.mlp.experts.138.up_proj", "model.layers.79.mlp.experts.139.up_proj", "model.layers.79.mlp.experts.140.up_proj", "model.layers.79.mlp.experts.141.up_proj", "model.layers.79.mlp.experts.142.up_proj", "model.layers.79.mlp.experts.143.up_proj", "model.layers.79.mlp.experts.144.up_proj", "model.layers.79.mlp.experts.145.up_proj", "model.layers.79.mlp.experts.146.up_proj", "model.layers.79.mlp.experts.147.up_proj", "model.layers.79.mlp.experts.148.up_proj", "model.layers.79.mlp.experts.149.up_proj", "model.layers.79.mlp.experts.150.up_proj", "model.layers.79.mlp.experts.151.up_proj", "model.layers.79.mlp.experts.152.up_proj", "model.layers.79.mlp.experts.153.up_proj", "model.layers.79.mlp.experts.154.up_proj", "model.layers.79.mlp.experts.155.up_proj", "model.layers.79.mlp.experts.156.up_proj", "model.layers.79.mlp.experts.157.up_proj", "model.layers.79.mlp.experts.158.up_proj", "model.layers.79.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -5.9168227016924424e-05, "dbits": 2516582400 }, { "dkld": -4.960382357239654e-05, "dbits": 5033164800 } ] }, { "idx": 476, "layers": [ "model.layers.79.mlp.experts.0.down_proj", "model.layers.79.mlp.experts.1.down_proj", "model.layers.79.mlp.experts.2.down_proj", "model.layers.79.mlp.experts.3.down_proj", "model.layers.79.mlp.experts.4.down_proj", "model.layers.79.mlp.experts.5.down_proj", "model.layers.79.mlp.experts.6.down_proj", "model.layers.79.mlp.experts.7.down_proj", "model.layers.79.mlp.experts.8.down_proj", "model.layers.79.mlp.experts.9.down_proj", "model.layers.79.mlp.experts.10.down_proj", "model.layers.79.mlp.experts.11.down_proj", "model.layers.79.mlp.experts.12.down_proj", "model.layers.79.mlp.experts.13.down_proj", "model.layers.79.mlp.experts.14.down_proj", "model.layers.79.mlp.experts.15.down_proj", "model.layers.79.mlp.experts.16.down_proj", "model.layers.79.mlp.experts.17.down_proj", "model.layers.79.mlp.experts.18.down_proj", "model.layers.79.mlp.experts.19.down_proj", "model.layers.79.mlp.experts.20.down_proj", "model.layers.79.mlp.experts.21.down_proj", "model.layers.79.mlp.experts.22.down_proj", "model.layers.79.mlp.experts.23.down_proj", "model.layers.79.mlp.experts.24.down_proj", "model.layers.79.mlp.experts.25.down_proj", "model.layers.79.mlp.experts.26.down_proj", "model.layers.79.mlp.experts.27.down_proj", "model.layers.79.mlp.experts.28.down_proj", "model.layers.79.mlp.experts.29.down_proj", "model.layers.79.mlp.experts.30.down_proj", "model.layers.79.mlp.experts.31.down_proj", "model.layers.79.mlp.experts.32.down_proj", "model.layers.79.mlp.experts.33.down_proj", "model.layers.79.mlp.experts.34.down_proj", "model.layers.79.mlp.experts.35.down_proj", "model.layers.79.mlp.experts.36.down_proj", "model.layers.79.mlp.experts.37.down_proj", "model.layers.79.mlp.experts.38.down_proj", "model.layers.79.mlp.experts.39.down_proj", "model.layers.79.mlp.experts.40.down_proj", "model.layers.79.mlp.experts.41.down_proj", "model.layers.79.mlp.experts.42.down_proj", "model.layers.79.mlp.experts.43.down_proj", "model.layers.79.mlp.experts.44.down_proj", "model.layers.79.mlp.experts.45.down_proj", "model.layers.79.mlp.experts.46.down_proj", "model.layers.79.mlp.experts.47.down_proj", "model.layers.79.mlp.experts.48.down_proj", "model.layers.79.mlp.experts.49.down_proj", "model.layers.79.mlp.experts.50.down_proj", "model.layers.79.mlp.experts.51.down_proj", "model.layers.79.mlp.experts.52.down_proj", "model.layers.79.mlp.experts.53.down_proj", "model.layers.79.mlp.experts.54.down_proj", "model.layers.79.mlp.experts.55.down_proj", "model.layers.79.mlp.experts.56.down_proj", "model.layers.79.mlp.experts.57.down_proj", "model.layers.79.mlp.experts.58.down_proj", "model.layers.79.mlp.experts.59.down_proj", "model.layers.79.mlp.experts.60.down_proj", "model.layers.79.mlp.experts.61.down_proj", "model.layers.79.mlp.experts.62.down_proj", "model.layers.79.mlp.experts.63.down_proj", "model.layers.79.mlp.experts.64.down_proj", "model.layers.79.mlp.experts.65.down_proj", "model.layers.79.mlp.experts.66.down_proj", "model.layers.79.mlp.experts.67.down_proj", "model.layers.79.mlp.experts.68.down_proj", "model.layers.79.mlp.experts.69.down_proj", "model.layers.79.mlp.experts.70.down_proj", "model.layers.79.mlp.experts.71.down_proj", "model.layers.79.mlp.experts.72.down_proj", "model.layers.79.mlp.experts.73.down_proj", "model.layers.79.mlp.experts.74.down_proj", "model.layers.79.mlp.experts.75.down_proj", "model.layers.79.mlp.experts.76.down_proj", "model.layers.79.mlp.experts.77.down_proj", "model.layers.79.mlp.experts.78.down_proj", "model.layers.79.mlp.experts.79.down_proj", "model.layers.79.mlp.experts.80.down_proj", "model.layers.79.mlp.experts.81.down_proj", "model.layers.79.mlp.experts.82.down_proj", "model.layers.79.mlp.experts.83.down_proj", "model.layers.79.mlp.experts.84.down_proj", "model.layers.79.mlp.experts.85.down_proj", "model.layers.79.mlp.experts.86.down_proj", "model.layers.79.mlp.experts.87.down_proj", "model.layers.79.mlp.experts.88.down_proj", "model.layers.79.mlp.experts.89.down_proj", "model.layers.79.mlp.experts.90.down_proj", "model.layers.79.mlp.experts.91.down_proj", "model.layers.79.mlp.experts.92.down_proj", "model.layers.79.mlp.experts.93.down_proj", "model.layers.79.mlp.experts.94.down_proj", "model.layers.79.mlp.experts.95.down_proj", "model.layers.79.mlp.experts.96.down_proj", "model.layers.79.mlp.experts.97.down_proj", "model.layers.79.mlp.experts.98.down_proj", "model.layers.79.mlp.experts.99.down_proj", "model.layers.79.mlp.experts.100.down_proj", "model.layers.79.mlp.experts.101.down_proj", "model.layers.79.mlp.experts.102.down_proj", "model.layers.79.mlp.experts.103.down_proj", "model.layers.79.mlp.experts.104.down_proj", "model.layers.79.mlp.experts.105.down_proj", "model.layers.79.mlp.experts.106.down_proj", "model.layers.79.mlp.experts.107.down_proj", "model.layers.79.mlp.experts.108.down_proj", "model.layers.79.mlp.experts.109.down_proj", "model.layers.79.mlp.experts.110.down_proj", "model.layers.79.mlp.experts.111.down_proj", "model.layers.79.mlp.experts.112.down_proj", "model.layers.79.mlp.experts.113.down_proj", "model.layers.79.mlp.experts.114.down_proj", "model.layers.79.mlp.experts.115.down_proj", "model.layers.79.mlp.experts.116.down_proj", "model.layers.79.mlp.experts.117.down_proj", "model.layers.79.mlp.experts.118.down_proj", "model.layers.79.mlp.experts.119.down_proj", "model.layers.79.mlp.experts.120.down_proj", "model.layers.79.mlp.experts.121.down_proj", "model.layers.79.mlp.experts.122.down_proj", "model.layers.79.mlp.experts.123.down_proj", "model.layers.79.mlp.experts.124.down_proj", "model.layers.79.mlp.experts.125.down_proj", "model.layers.79.mlp.experts.126.down_proj", "model.layers.79.mlp.experts.127.down_proj", "model.layers.79.mlp.experts.128.down_proj", "model.layers.79.mlp.experts.129.down_proj", "model.layers.79.mlp.experts.130.down_proj", "model.layers.79.mlp.experts.131.down_proj", "model.layers.79.mlp.experts.132.down_proj", "model.layers.79.mlp.experts.133.down_proj", "model.layers.79.mlp.experts.134.down_proj", "model.layers.79.mlp.experts.135.down_proj", "model.layers.79.mlp.experts.136.down_proj", "model.layers.79.mlp.experts.137.down_proj", "model.layers.79.mlp.experts.138.down_proj", "model.layers.79.mlp.experts.139.down_proj", "model.layers.79.mlp.experts.140.down_proj", "model.layers.79.mlp.experts.141.down_proj", "model.layers.79.mlp.experts.142.down_proj", "model.layers.79.mlp.experts.143.down_proj", "model.layers.79.mlp.experts.144.down_proj", "model.layers.79.mlp.experts.145.down_proj", "model.layers.79.mlp.experts.146.down_proj", "model.layers.79.mlp.experts.147.down_proj", "model.layers.79.mlp.experts.148.down_proj", "model.layers.79.mlp.experts.149.down_proj", "model.layers.79.mlp.experts.150.down_proj", "model.layers.79.mlp.experts.151.down_proj", "model.layers.79.mlp.experts.152.down_proj", "model.layers.79.mlp.experts.153.down_proj", "model.layers.79.mlp.experts.154.down_proj", "model.layers.79.mlp.experts.155.down_proj", "model.layers.79.mlp.experts.156.down_proj", "model.layers.79.mlp.experts.157.down_proj", "model.layers.79.mlp.experts.158.down_proj", "model.layers.79.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 2.5439215824008335e-05, "dbits": 1258291200 }, { "dkld": 2.2127805277705886e-05, "dbits": 2516582400 } ] }, { "idx": 477, "layers": [ "model.layers.80.self_attn.q_proj" ], "candidates": [ { "dkld": 0.0001879401272162802, "dbits": 62914560 }, { "dkld": 7.688179612159833e-05, "dbits": 125829120 } ] }, { "idx": 478, "layers": [ "model.layers.80.self_attn.k_proj", "model.layers.80.self_attn.v_proj" ], "candidates": [ { "dkld": 5.330918356776307e-05, "dbits": 10485760 }, { "dkld": 4.703225567937591e-06, "dbits": 20971520 } ] }, { "idx": 479, "layers": [ "model.layers.80.self_attn.o_proj" ], "candidates": [ { "dkld": -1.3583805412043654e-06, "dbits": 62914560 }, { "dkld": 1.9217608496560623e-06, "dbits": 125829120 } ] }, { "idx": 480, "layers": [ "model.layers.80.mlp.shared_experts.gate_proj", "model.layers.80.mlp.shared_experts.up_proj", "model.layers.80.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -8.657420985400642e-05, "dbits": 23592960 }, { "dkld": -6.31556846201406e-05, "dbits": 47185920 } ] }, { "idx": 481, "layers": [ "model.layers.80.mlp.experts.0.gate_proj", "model.layers.80.mlp.experts.1.gate_proj", "model.layers.80.mlp.experts.2.gate_proj", "model.layers.80.mlp.experts.3.gate_proj", "model.layers.80.mlp.experts.4.gate_proj", "model.layers.80.mlp.experts.5.gate_proj", "model.layers.80.mlp.experts.6.gate_proj", "model.layers.80.mlp.experts.7.gate_proj", "model.layers.80.mlp.experts.8.gate_proj", "model.layers.80.mlp.experts.9.gate_proj", "model.layers.80.mlp.experts.10.gate_proj", "model.layers.80.mlp.experts.11.gate_proj", "model.layers.80.mlp.experts.12.gate_proj", "model.layers.80.mlp.experts.13.gate_proj", "model.layers.80.mlp.experts.14.gate_proj", "model.layers.80.mlp.experts.15.gate_proj", "model.layers.80.mlp.experts.16.gate_proj", "model.layers.80.mlp.experts.17.gate_proj", "model.layers.80.mlp.experts.18.gate_proj", "model.layers.80.mlp.experts.19.gate_proj", "model.layers.80.mlp.experts.20.gate_proj", "model.layers.80.mlp.experts.21.gate_proj", "model.layers.80.mlp.experts.22.gate_proj", "model.layers.80.mlp.experts.23.gate_proj", "model.layers.80.mlp.experts.24.gate_proj", "model.layers.80.mlp.experts.25.gate_proj", "model.layers.80.mlp.experts.26.gate_proj", "model.layers.80.mlp.experts.27.gate_proj", "model.layers.80.mlp.experts.28.gate_proj", "model.layers.80.mlp.experts.29.gate_proj", "model.layers.80.mlp.experts.30.gate_proj", "model.layers.80.mlp.experts.31.gate_proj", "model.layers.80.mlp.experts.32.gate_proj", "model.layers.80.mlp.experts.33.gate_proj", "model.layers.80.mlp.experts.34.gate_proj", "model.layers.80.mlp.experts.35.gate_proj", "model.layers.80.mlp.experts.36.gate_proj", "model.layers.80.mlp.experts.37.gate_proj", "model.layers.80.mlp.experts.38.gate_proj", "model.layers.80.mlp.experts.39.gate_proj", "model.layers.80.mlp.experts.40.gate_proj", "model.layers.80.mlp.experts.41.gate_proj", "model.layers.80.mlp.experts.42.gate_proj", "model.layers.80.mlp.experts.43.gate_proj", "model.layers.80.mlp.experts.44.gate_proj", "model.layers.80.mlp.experts.45.gate_proj", "model.layers.80.mlp.experts.46.gate_proj", "model.layers.80.mlp.experts.47.gate_proj", "model.layers.80.mlp.experts.48.gate_proj", "model.layers.80.mlp.experts.49.gate_proj", "model.layers.80.mlp.experts.50.gate_proj", "model.layers.80.mlp.experts.51.gate_proj", "model.layers.80.mlp.experts.52.gate_proj", "model.layers.80.mlp.experts.53.gate_proj", "model.layers.80.mlp.experts.54.gate_proj", "model.layers.80.mlp.experts.55.gate_proj", "model.layers.80.mlp.experts.56.gate_proj", "model.layers.80.mlp.experts.57.gate_proj", "model.layers.80.mlp.experts.58.gate_proj", "model.layers.80.mlp.experts.59.gate_proj", "model.layers.80.mlp.experts.60.gate_proj", "model.layers.80.mlp.experts.61.gate_proj", "model.layers.80.mlp.experts.62.gate_proj", "model.layers.80.mlp.experts.63.gate_proj", "model.layers.80.mlp.experts.64.gate_proj", "model.layers.80.mlp.experts.65.gate_proj", "model.layers.80.mlp.experts.66.gate_proj", "model.layers.80.mlp.experts.67.gate_proj", "model.layers.80.mlp.experts.68.gate_proj", "model.layers.80.mlp.experts.69.gate_proj", "model.layers.80.mlp.experts.70.gate_proj", "model.layers.80.mlp.experts.71.gate_proj", "model.layers.80.mlp.experts.72.gate_proj", "model.layers.80.mlp.experts.73.gate_proj", "model.layers.80.mlp.experts.74.gate_proj", "model.layers.80.mlp.experts.75.gate_proj", "model.layers.80.mlp.experts.76.gate_proj", "model.layers.80.mlp.experts.77.gate_proj", "model.layers.80.mlp.experts.78.gate_proj", "model.layers.80.mlp.experts.79.gate_proj", "model.layers.80.mlp.experts.80.gate_proj", "model.layers.80.mlp.experts.81.gate_proj", "model.layers.80.mlp.experts.82.gate_proj", "model.layers.80.mlp.experts.83.gate_proj", "model.layers.80.mlp.experts.84.gate_proj", "model.layers.80.mlp.experts.85.gate_proj", "model.layers.80.mlp.experts.86.gate_proj", "model.layers.80.mlp.experts.87.gate_proj", "model.layers.80.mlp.experts.88.gate_proj", "model.layers.80.mlp.experts.89.gate_proj", "model.layers.80.mlp.experts.90.gate_proj", "model.layers.80.mlp.experts.91.gate_proj", "model.layers.80.mlp.experts.92.gate_proj", "model.layers.80.mlp.experts.93.gate_proj", "model.layers.80.mlp.experts.94.gate_proj", "model.layers.80.mlp.experts.95.gate_proj", "model.layers.80.mlp.experts.96.gate_proj", "model.layers.80.mlp.experts.97.gate_proj", "model.layers.80.mlp.experts.98.gate_proj", "model.layers.80.mlp.experts.99.gate_proj", "model.layers.80.mlp.experts.100.gate_proj", "model.layers.80.mlp.experts.101.gate_proj", "model.layers.80.mlp.experts.102.gate_proj", "model.layers.80.mlp.experts.103.gate_proj", "model.layers.80.mlp.experts.104.gate_proj", "model.layers.80.mlp.experts.105.gate_proj", "model.layers.80.mlp.experts.106.gate_proj", "model.layers.80.mlp.experts.107.gate_proj", "model.layers.80.mlp.experts.108.gate_proj", "model.layers.80.mlp.experts.109.gate_proj", "model.layers.80.mlp.experts.110.gate_proj", "model.layers.80.mlp.experts.111.gate_proj", "model.layers.80.mlp.experts.112.gate_proj", "model.layers.80.mlp.experts.113.gate_proj", "model.layers.80.mlp.experts.114.gate_proj", "model.layers.80.mlp.experts.115.gate_proj", "model.layers.80.mlp.experts.116.gate_proj", "model.layers.80.mlp.experts.117.gate_proj", "model.layers.80.mlp.experts.118.gate_proj", "model.layers.80.mlp.experts.119.gate_proj", "model.layers.80.mlp.experts.120.gate_proj", "model.layers.80.mlp.experts.121.gate_proj", "model.layers.80.mlp.experts.122.gate_proj", "model.layers.80.mlp.experts.123.gate_proj", "model.layers.80.mlp.experts.124.gate_proj", "model.layers.80.mlp.experts.125.gate_proj", "model.layers.80.mlp.experts.126.gate_proj", "model.layers.80.mlp.experts.127.gate_proj", "model.layers.80.mlp.experts.128.gate_proj", "model.layers.80.mlp.experts.129.gate_proj", "model.layers.80.mlp.experts.130.gate_proj", "model.layers.80.mlp.experts.131.gate_proj", "model.layers.80.mlp.experts.132.gate_proj", "model.layers.80.mlp.experts.133.gate_proj", "model.layers.80.mlp.experts.134.gate_proj", "model.layers.80.mlp.experts.135.gate_proj", "model.layers.80.mlp.experts.136.gate_proj", "model.layers.80.mlp.experts.137.gate_proj", "model.layers.80.mlp.experts.138.gate_proj", "model.layers.80.mlp.experts.139.gate_proj", "model.layers.80.mlp.experts.140.gate_proj", "model.layers.80.mlp.experts.141.gate_proj", "model.layers.80.mlp.experts.142.gate_proj", "model.layers.80.mlp.experts.143.gate_proj", "model.layers.80.mlp.experts.144.gate_proj", "model.layers.80.mlp.experts.145.gate_proj", "model.layers.80.mlp.experts.146.gate_proj", "model.layers.80.mlp.experts.147.gate_proj", "model.layers.80.mlp.experts.148.gate_proj", "model.layers.80.mlp.experts.149.gate_proj", "model.layers.80.mlp.experts.150.gate_proj", "model.layers.80.mlp.experts.151.gate_proj", "model.layers.80.mlp.experts.152.gate_proj", "model.layers.80.mlp.experts.153.gate_proj", "model.layers.80.mlp.experts.154.gate_proj", "model.layers.80.mlp.experts.155.gate_proj", "model.layers.80.mlp.experts.156.gate_proj", "model.layers.80.mlp.experts.157.gate_proj", "model.layers.80.mlp.experts.158.gate_proj", "model.layers.80.mlp.experts.159.gate_proj", "model.layers.80.mlp.experts.0.up_proj", "model.layers.80.mlp.experts.1.up_proj", "model.layers.80.mlp.experts.2.up_proj", "model.layers.80.mlp.experts.3.up_proj", "model.layers.80.mlp.experts.4.up_proj", "model.layers.80.mlp.experts.5.up_proj", "model.layers.80.mlp.experts.6.up_proj", "model.layers.80.mlp.experts.7.up_proj", "model.layers.80.mlp.experts.8.up_proj", "model.layers.80.mlp.experts.9.up_proj", "model.layers.80.mlp.experts.10.up_proj", "model.layers.80.mlp.experts.11.up_proj", "model.layers.80.mlp.experts.12.up_proj", "model.layers.80.mlp.experts.13.up_proj", "model.layers.80.mlp.experts.14.up_proj", "model.layers.80.mlp.experts.15.up_proj", "model.layers.80.mlp.experts.16.up_proj", "model.layers.80.mlp.experts.17.up_proj", "model.layers.80.mlp.experts.18.up_proj", "model.layers.80.mlp.experts.19.up_proj", "model.layers.80.mlp.experts.20.up_proj", "model.layers.80.mlp.experts.21.up_proj", "model.layers.80.mlp.experts.22.up_proj", "model.layers.80.mlp.experts.23.up_proj", "model.layers.80.mlp.experts.24.up_proj", "model.layers.80.mlp.experts.25.up_proj", "model.layers.80.mlp.experts.26.up_proj", "model.layers.80.mlp.experts.27.up_proj", "model.layers.80.mlp.experts.28.up_proj", "model.layers.80.mlp.experts.29.up_proj", "model.layers.80.mlp.experts.30.up_proj", "model.layers.80.mlp.experts.31.up_proj", "model.layers.80.mlp.experts.32.up_proj", "model.layers.80.mlp.experts.33.up_proj", "model.layers.80.mlp.experts.34.up_proj", "model.layers.80.mlp.experts.35.up_proj", "model.layers.80.mlp.experts.36.up_proj", "model.layers.80.mlp.experts.37.up_proj", "model.layers.80.mlp.experts.38.up_proj", "model.layers.80.mlp.experts.39.up_proj", "model.layers.80.mlp.experts.40.up_proj", "model.layers.80.mlp.experts.41.up_proj", "model.layers.80.mlp.experts.42.up_proj", "model.layers.80.mlp.experts.43.up_proj", "model.layers.80.mlp.experts.44.up_proj", "model.layers.80.mlp.experts.45.up_proj", "model.layers.80.mlp.experts.46.up_proj", "model.layers.80.mlp.experts.47.up_proj", "model.layers.80.mlp.experts.48.up_proj", "model.layers.80.mlp.experts.49.up_proj", "model.layers.80.mlp.experts.50.up_proj", "model.layers.80.mlp.experts.51.up_proj", "model.layers.80.mlp.experts.52.up_proj", "model.layers.80.mlp.experts.53.up_proj", "model.layers.80.mlp.experts.54.up_proj", "model.layers.80.mlp.experts.55.up_proj", "model.layers.80.mlp.experts.56.up_proj", "model.layers.80.mlp.experts.57.up_proj", "model.layers.80.mlp.experts.58.up_proj", "model.layers.80.mlp.experts.59.up_proj", "model.layers.80.mlp.experts.60.up_proj", "model.layers.80.mlp.experts.61.up_proj", "model.layers.80.mlp.experts.62.up_proj", "model.layers.80.mlp.experts.63.up_proj", "model.layers.80.mlp.experts.64.up_proj", "model.layers.80.mlp.experts.65.up_proj", "model.layers.80.mlp.experts.66.up_proj", "model.layers.80.mlp.experts.67.up_proj", "model.layers.80.mlp.experts.68.up_proj", "model.layers.80.mlp.experts.69.up_proj", "model.layers.80.mlp.experts.70.up_proj", "model.layers.80.mlp.experts.71.up_proj", "model.layers.80.mlp.experts.72.up_proj", "model.layers.80.mlp.experts.73.up_proj", "model.layers.80.mlp.experts.74.up_proj", "model.layers.80.mlp.experts.75.up_proj", "model.layers.80.mlp.experts.76.up_proj", "model.layers.80.mlp.experts.77.up_proj", "model.layers.80.mlp.experts.78.up_proj", "model.layers.80.mlp.experts.79.up_proj", "model.layers.80.mlp.experts.80.up_proj", "model.layers.80.mlp.experts.81.up_proj", "model.layers.80.mlp.experts.82.up_proj", "model.layers.80.mlp.experts.83.up_proj", "model.layers.80.mlp.experts.84.up_proj", "model.layers.80.mlp.experts.85.up_proj", "model.layers.80.mlp.experts.86.up_proj", "model.layers.80.mlp.experts.87.up_proj", "model.layers.80.mlp.experts.88.up_proj", "model.layers.80.mlp.experts.89.up_proj", "model.layers.80.mlp.experts.90.up_proj", "model.layers.80.mlp.experts.91.up_proj", "model.layers.80.mlp.experts.92.up_proj", "model.layers.80.mlp.experts.93.up_proj", "model.layers.80.mlp.experts.94.up_proj", "model.layers.80.mlp.experts.95.up_proj", "model.layers.80.mlp.experts.96.up_proj", "model.layers.80.mlp.experts.97.up_proj", "model.layers.80.mlp.experts.98.up_proj", "model.layers.80.mlp.experts.99.up_proj", "model.layers.80.mlp.experts.100.up_proj", "model.layers.80.mlp.experts.101.up_proj", "model.layers.80.mlp.experts.102.up_proj", "model.layers.80.mlp.experts.103.up_proj", "model.layers.80.mlp.experts.104.up_proj", "model.layers.80.mlp.experts.105.up_proj", "model.layers.80.mlp.experts.106.up_proj", "model.layers.80.mlp.experts.107.up_proj", "model.layers.80.mlp.experts.108.up_proj", "model.layers.80.mlp.experts.109.up_proj", "model.layers.80.mlp.experts.110.up_proj", "model.layers.80.mlp.experts.111.up_proj", "model.layers.80.mlp.experts.112.up_proj", "model.layers.80.mlp.experts.113.up_proj", "model.layers.80.mlp.experts.114.up_proj", "model.layers.80.mlp.experts.115.up_proj", "model.layers.80.mlp.experts.116.up_proj", "model.layers.80.mlp.experts.117.up_proj", "model.layers.80.mlp.experts.118.up_proj", "model.layers.80.mlp.experts.119.up_proj", "model.layers.80.mlp.experts.120.up_proj", "model.layers.80.mlp.experts.121.up_proj", "model.layers.80.mlp.experts.122.up_proj", "model.layers.80.mlp.experts.123.up_proj", "model.layers.80.mlp.experts.124.up_proj", "model.layers.80.mlp.experts.125.up_proj", "model.layers.80.mlp.experts.126.up_proj", "model.layers.80.mlp.experts.127.up_proj", "model.layers.80.mlp.experts.128.up_proj", "model.layers.80.mlp.experts.129.up_proj", "model.layers.80.mlp.experts.130.up_proj", "model.layers.80.mlp.experts.131.up_proj", "model.layers.80.mlp.experts.132.up_proj", "model.layers.80.mlp.experts.133.up_proj", "model.layers.80.mlp.experts.134.up_proj", "model.layers.80.mlp.experts.135.up_proj", "model.layers.80.mlp.experts.136.up_proj", "model.layers.80.mlp.experts.137.up_proj", "model.layers.80.mlp.experts.138.up_proj", "model.layers.80.mlp.experts.139.up_proj", "model.layers.80.mlp.experts.140.up_proj", "model.layers.80.mlp.experts.141.up_proj", "model.layers.80.mlp.experts.142.up_proj", "model.layers.80.mlp.experts.143.up_proj", "model.layers.80.mlp.experts.144.up_proj", "model.layers.80.mlp.experts.145.up_proj", "model.layers.80.mlp.experts.146.up_proj", "model.layers.80.mlp.experts.147.up_proj", "model.layers.80.mlp.experts.148.up_proj", "model.layers.80.mlp.experts.149.up_proj", "model.layers.80.mlp.experts.150.up_proj", "model.layers.80.mlp.experts.151.up_proj", "model.layers.80.mlp.experts.152.up_proj", "model.layers.80.mlp.experts.153.up_proj", "model.layers.80.mlp.experts.154.up_proj", "model.layers.80.mlp.experts.155.up_proj", "model.layers.80.mlp.experts.156.up_proj", "model.layers.80.mlp.experts.157.up_proj", "model.layers.80.mlp.experts.158.up_proj", "model.layers.80.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 6.937701255083778e-06, "dbits": 2516582400 }, { "dkld": 3.287033177912929e-06, "dbits": 5033164800 } ] }, { "idx": 482, "layers": [ "model.layers.80.mlp.experts.0.down_proj", "model.layers.80.mlp.experts.1.down_proj", "model.layers.80.mlp.experts.2.down_proj", "model.layers.80.mlp.experts.3.down_proj", "model.layers.80.mlp.experts.4.down_proj", "model.layers.80.mlp.experts.5.down_proj", "model.layers.80.mlp.experts.6.down_proj", "model.layers.80.mlp.experts.7.down_proj", "model.layers.80.mlp.experts.8.down_proj", "model.layers.80.mlp.experts.9.down_proj", "model.layers.80.mlp.experts.10.down_proj", "model.layers.80.mlp.experts.11.down_proj", "model.layers.80.mlp.experts.12.down_proj", "model.layers.80.mlp.experts.13.down_proj", "model.layers.80.mlp.experts.14.down_proj", "model.layers.80.mlp.experts.15.down_proj", "model.layers.80.mlp.experts.16.down_proj", "model.layers.80.mlp.experts.17.down_proj", "model.layers.80.mlp.experts.18.down_proj", "model.layers.80.mlp.experts.19.down_proj", "model.layers.80.mlp.experts.20.down_proj", "model.layers.80.mlp.experts.21.down_proj", "model.layers.80.mlp.experts.22.down_proj", "model.layers.80.mlp.experts.23.down_proj", "model.layers.80.mlp.experts.24.down_proj", "model.layers.80.mlp.experts.25.down_proj", "model.layers.80.mlp.experts.26.down_proj", "model.layers.80.mlp.experts.27.down_proj", "model.layers.80.mlp.experts.28.down_proj", "model.layers.80.mlp.experts.29.down_proj", "model.layers.80.mlp.experts.30.down_proj", "model.layers.80.mlp.experts.31.down_proj", "model.layers.80.mlp.experts.32.down_proj", "model.layers.80.mlp.experts.33.down_proj", "model.layers.80.mlp.experts.34.down_proj", "model.layers.80.mlp.experts.35.down_proj", "model.layers.80.mlp.experts.36.down_proj", "model.layers.80.mlp.experts.37.down_proj", "model.layers.80.mlp.experts.38.down_proj", "model.layers.80.mlp.experts.39.down_proj", "model.layers.80.mlp.experts.40.down_proj", "model.layers.80.mlp.experts.41.down_proj", "model.layers.80.mlp.experts.42.down_proj", "model.layers.80.mlp.experts.43.down_proj", "model.layers.80.mlp.experts.44.down_proj", "model.layers.80.mlp.experts.45.down_proj", "model.layers.80.mlp.experts.46.down_proj", "model.layers.80.mlp.experts.47.down_proj", "model.layers.80.mlp.experts.48.down_proj", "model.layers.80.mlp.experts.49.down_proj", "model.layers.80.mlp.experts.50.down_proj", "model.layers.80.mlp.experts.51.down_proj", "model.layers.80.mlp.experts.52.down_proj", "model.layers.80.mlp.experts.53.down_proj", "model.layers.80.mlp.experts.54.down_proj", "model.layers.80.mlp.experts.55.down_proj", "model.layers.80.mlp.experts.56.down_proj", "model.layers.80.mlp.experts.57.down_proj", "model.layers.80.mlp.experts.58.down_proj", "model.layers.80.mlp.experts.59.down_proj", "model.layers.80.mlp.experts.60.down_proj", "model.layers.80.mlp.experts.61.down_proj", "model.layers.80.mlp.experts.62.down_proj", "model.layers.80.mlp.experts.63.down_proj", "model.layers.80.mlp.experts.64.down_proj", "model.layers.80.mlp.experts.65.down_proj", "model.layers.80.mlp.experts.66.down_proj", "model.layers.80.mlp.experts.67.down_proj", "model.layers.80.mlp.experts.68.down_proj", "model.layers.80.mlp.experts.69.down_proj", "model.layers.80.mlp.experts.70.down_proj", "model.layers.80.mlp.experts.71.down_proj", "model.layers.80.mlp.experts.72.down_proj", "model.layers.80.mlp.experts.73.down_proj", "model.layers.80.mlp.experts.74.down_proj", "model.layers.80.mlp.experts.75.down_proj", "model.layers.80.mlp.experts.76.down_proj", "model.layers.80.mlp.experts.77.down_proj", "model.layers.80.mlp.experts.78.down_proj", "model.layers.80.mlp.experts.79.down_proj", "model.layers.80.mlp.experts.80.down_proj", "model.layers.80.mlp.experts.81.down_proj", "model.layers.80.mlp.experts.82.down_proj", "model.layers.80.mlp.experts.83.down_proj", "model.layers.80.mlp.experts.84.down_proj", "model.layers.80.mlp.experts.85.down_proj", "model.layers.80.mlp.experts.86.down_proj", "model.layers.80.mlp.experts.87.down_proj", "model.layers.80.mlp.experts.88.down_proj", "model.layers.80.mlp.experts.89.down_proj", "model.layers.80.mlp.experts.90.down_proj", "model.layers.80.mlp.experts.91.down_proj", "model.layers.80.mlp.experts.92.down_proj", "model.layers.80.mlp.experts.93.down_proj", "model.layers.80.mlp.experts.94.down_proj", "model.layers.80.mlp.experts.95.down_proj", "model.layers.80.mlp.experts.96.down_proj", "model.layers.80.mlp.experts.97.down_proj", "model.layers.80.mlp.experts.98.down_proj", "model.layers.80.mlp.experts.99.down_proj", "model.layers.80.mlp.experts.100.down_proj", "model.layers.80.mlp.experts.101.down_proj", "model.layers.80.mlp.experts.102.down_proj", "model.layers.80.mlp.experts.103.down_proj", "model.layers.80.mlp.experts.104.down_proj", "model.layers.80.mlp.experts.105.down_proj", "model.layers.80.mlp.experts.106.down_proj", "model.layers.80.mlp.experts.107.down_proj", "model.layers.80.mlp.experts.108.down_proj", "model.layers.80.mlp.experts.109.down_proj", "model.layers.80.mlp.experts.110.down_proj", "model.layers.80.mlp.experts.111.down_proj", "model.layers.80.mlp.experts.112.down_proj", "model.layers.80.mlp.experts.113.down_proj", "model.layers.80.mlp.experts.114.down_proj", "model.layers.80.mlp.experts.115.down_proj", "model.layers.80.mlp.experts.116.down_proj", "model.layers.80.mlp.experts.117.down_proj", "model.layers.80.mlp.experts.118.down_proj", "model.layers.80.mlp.experts.119.down_proj", "model.layers.80.mlp.experts.120.down_proj", "model.layers.80.mlp.experts.121.down_proj", "model.layers.80.mlp.experts.122.down_proj", "model.layers.80.mlp.experts.123.down_proj", "model.layers.80.mlp.experts.124.down_proj", "model.layers.80.mlp.experts.125.down_proj", "model.layers.80.mlp.experts.126.down_proj", "model.layers.80.mlp.experts.127.down_proj", "model.layers.80.mlp.experts.128.down_proj", "model.layers.80.mlp.experts.129.down_proj", "model.layers.80.mlp.experts.130.down_proj", "model.layers.80.mlp.experts.131.down_proj", "model.layers.80.mlp.experts.132.down_proj", "model.layers.80.mlp.experts.133.down_proj", "model.layers.80.mlp.experts.134.down_proj", "model.layers.80.mlp.experts.135.down_proj", "model.layers.80.mlp.experts.136.down_proj", "model.layers.80.mlp.experts.137.down_proj", "model.layers.80.mlp.experts.138.down_proj", "model.layers.80.mlp.experts.139.down_proj", "model.layers.80.mlp.experts.140.down_proj", "model.layers.80.mlp.experts.141.down_proj", "model.layers.80.mlp.experts.142.down_proj", "model.layers.80.mlp.experts.143.down_proj", "model.layers.80.mlp.experts.144.down_proj", "model.layers.80.mlp.experts.145.down_proj", "model.layers.80.mlp.experts.146.down_proj", "model.layers.80.mlp.experts.147.down_proj", "model.layers.80.mlp.experts.148.down_proj", "model.layers.80.mlp.experts.149.down_proj", "model.layers.80.mlp.experts.150.down_proj", "model.layers.80.mlp.experts.151.down_proj", "model.layers.80.mlp.experts.152.down_proj", "model.layers.80.mlp.experts.153.down_proj", "model.layers.80.mlp.experts.154.down_proj", "model.layers.80.mlp.experts.155.down_proj", "model.layers.80.mlp.experts.156.down_proj", "model.layers.80.mlp.experts.157.down_proj", "model.layers.80.mlp.experts.158.down_proj", "model.layers.80.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -4.875287413596066e-06, "dbits": 1258291200 }, { "dkld": -9.660352952777992e-06, "dbits": 2516582400 } ] }, { "idx": 483, "layers": [ "model.layers.81.self_attn.q_proj" ], "candidates": [ { "dkld": 8.721370249986649e-05, "dbits": 62914560 }, { "dkld": 4.344298504293034e-05, "dbits": 125829120 } ] }, { "idx": 484, "layers": [ "model.layers.81.self_attn.k_proj", "model.layers.81.self_attn.v_proj" ], "candidates": [ { "dkld": 4.576928913593327e-05, "dbits": 10485760 }, { "dkld": 5.88299473747618e-05, "dbits": 20971520 } ] }, { "idx": 485, "layers": [ "model.layers.81.self_attn.o_proj" ], "candidates": [ { "dkld": -1.5268428251146923e-05, "dbits": 62914560 }, { "dkld": -2.3640342988073826e-05, "dbits": 125829120 } ] }, { "idx": 486, "layers": [ "model.layers.81.mlp.shared_experts.gate_proj", "model.layers.81.mlp.shared_experts.up_proj", "model.layers.81.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.2236118093132626e-05, "dbits": 23592960 }, { "dkld": -5.7627703063188596e-05, "dbits": 47185920 } ] }, { "idx": 487, "layers": [ "model.layers.81.mlp.experts.0.gate_proj", "model.layers.81.mlp.experts.1.gate_proj", "model.layers.81.mlp.experts.2.gate_proj", "model.layers.81.mlp.experts.3.gate_proj", "model.layers.81.mlp.experts.4.gate_proj", "model.layers.81.mlp.experts.5.gate_proj", "model.layers.81.mlp.experts.6.gate_proj", "model.layers.81.mlp.experts.7.gate_proj", "model.layers.81.mlp.experts.8.gate_proj", "model.layers.81.mlp.experts.9.gate_proj", "model.layers.81.mlp.experts.10.gate_proj", "model.layers.81.mlp.experts.11.gate_proj", "model.layers.81.mlp.experts.12.gate_proj", "model.layers.81.mlp.experts.13.gate_proj", "model.layers.81.mlp.experts.14.gate_proj", "model.layers.81.mlp.experts.15.gate_proj", "model.layers.81.mlp.experts.16.gate_proj", "model.layers.81.mlp.experts.17.gate_proj", "model.layers.81.mlp.experts.18.gate_proj", "model.layers.81.mlp.experts.19.gate_proj", "model.layers.81.mlp.experts.20.gate_proj", "model.layers.81.mlp.experts.21.gate_proj", "model.layers.81.mlp.experts.22.gate_proj", "model.layers.81.mlp.experts.23.gate_proj", "model.layers.81.mlp.experts.24.gate_proj", "model.layers.81.mlp.experts.25.gate_proj", "model.layers.81.mlp.experts.26.gate_proj", "model.layers.81.mlp.experts.27.gate_proj", "model.layers.81.mlp.experts.28.gate_proj", "model.layers.81.mlp.experts.29.gate_proj", "model.layers.81.mlp.experts.30.gate_proj", "model.layers.81.mlp.experts.31.gate_proj", "model.layers.81.mlp.experts.32.gate_proj", "model.layers.81.mlp.experts.33.gate_proj", "model.layers.81.mlp.experts.34.gate_proj", "model.layers.81.mlp.experts.35.gate_proj", "model.layers.81.mlp.experts.36.gate_proj", "model.layers.81.mlp.experts.37.gate_proj", "model.layers.81.mlp.experts.38.gate_proj", "model.layers.81.mlp.experts.39.gate_proj", "model.layers.81.mlp.experts.40.gate_proj", "model.layers.81.mlp.experts.41.gate_proj", "model.layers.81.mlp.experts.42.gate_proj", "model.layers.81.mlp.experts.43.gate_proj", "model.layers.81.mlp.experts.44.gate_proj", "model.layers.81.mlp.experts.45.gate_proj", "model.layers.81.mlp.experts.46.gate_proj", "model.layers.81.mlp.experts.47.gate_proj", "model.layers.81.mlp.experts.48.gate_proj", "model.layers.81.mlp.experts.49.gate_proj", "model.layers.81.mlp.experts.50.gate_proj", "model.layers.81.mlp.experts.51.gate_proj", "model.layers.81.mlp.experts.52.gate_proj", "model.layers.81.mlp.experts.53.gate_proj", "model.layers.81.mlp.experts.54.gate_proj", "model.layers.81.mlp.experts.55.gate_proj", "model.layers.81.mlp.experts.56.gate_proj", "model.layers.81.mlp.experts.57.gate_proj", "model.layers.81.mlp.experts.58.gate_proj", "model.layers.81.mlp.experts.59.gate_proj", "model.layers.81.mlp.experts.60.gate_proj", "model.layers.81.mlp.experts.61.gate_proj", "model.layers.81.mlp.experts.62.gate_proj", "model.layers.81.mlp.experts.63.gate_proj", "model.layers.81.mlp.experts.64.gate_proj", "model.layers.81.mlp.experts.65.gate_proj", "model.layers.81.mlp.experts.66.gate_proj", "model.layers.81.mlp.experts.67.gate_proj", "model.layers.81.mlp.experts.68.gate_proj", "model.layers.81.mlp.experts.69.gate_proj", "model.layers.81.mlp.experts.70.gate_proj", "model.layers.81.mlp.experts.71.gate_proj", "model.layers.81.mlp.experts.72.gate_proj", "model.layers.81.mlp.experts.73.gate_proj", "model.layers.81.mlp.experts.74.gate_proj", "model.layers.81.mlp.experts.75.gate_proj", "model.layers.81.mlp.experts.76.gate_proj", "model.layers.81.mlp.experts.77.gate_proj", "model.layers.81.mlp.experts.78.gate_proj", "model.layers.81.mlp.experts.79.gate_proj", "model.layers.81.mlp.experts.80.gate_proj", "model.layers.81.mlp.experts.81.gate_proj", "model.layers.81.mlp.experts.82.gate_proj", "model.layers.81.mlp.experts.83.gate_proj", "model.layers.81.mlp.experts.84.gate_proj", "model.layers.81.mlp.experts.85.gate_proj", "model.layers.81.mlp.experts.86.gate_proj", "model.layers.81.mlp.experts.87.gate_proj", "model.layers.81.mlp.experts.88.gate_proj", "model.layers.81.mlp.experts.89.gate_proj", "model.layers.81.mlp.experts.90.gate_proj", "model.layers.81.mlp.experts.91.gate_proj", "model.layers.81.mlp.experts.92.gate_proj", "model.layers.81.mlp.experts.93.gate_proj", "model.layers.81.mlp.experts.94.gate_proj", "model.layers.81.mlp.experts.95.gate_proj", "model.layers.81.mlp.experts.96.gate_proj", "model.layers.81.mlp.experts.97.gate_proj", "model.layers.81.mlp.experts.98.gate_proj", "model.layers.81.mlp.experts.99.gate_proj", "model.layers.81.mlp.experts.100.gate_proj", "model.layers.81.mlp.experts.101.gate_proj", "model.layers.81.mlp.experts.102.gate_proj", "model.layers.81.mlp.experts.103.gate_proj", "model.layers.81.mlp.experts.104.gate_proj", "model.layers.81.mlp.experts.105.gate_proj", "model.layers.81.mlp.experts.106.gate_proj", "model.layers.81.mlp.experts.107.gate_proj", "model.layers.81.mlp.experts.108.gate_proj", "model.layers.81.mlp.experts.109.gate_proj", "model.layers.81.mlp.experts.110.gate_proj", "model.layers.81.mlp.experts.111.gate_proj", "model.layers.81.mlp.experts.112.gate_proj", "model.layers.81.mlp.experts.113.gate_proj", "model.layers.81.mlp.experts.114.gate_proj", "model.layers.81.mlp.experts.115.gate_proj", "model.layers.81.mlp.experts.116.gate_proj", "model.layers.81.mlp.experts.117.gate_proj", "model.layers.81.mlp.experts.118.gate_proj", "model.layers.81.mlp.experts.119.gate_proj", "model.layers.81.mlp.experts.120.gate_proj", "model.layers.81.mlp.experts.121.gate_proj", "model.layers.81.mlp.experts.122.gate_proj", "model.layers.81.mlp.experts.123.gate_proj", "model.layers.81.mlp.experts.124.gate_proj", "model.layers.81.mlp.experts.125.gate_proj", "model.layers.81.mlp.experts.126.gate_proj", "model.layers.81.mlp.experts.127.gate_proj", "model.layers.81.mlp.experts.128.gate_proj", "model.layers.81.mlp.experts.129.gate_proj", "model.layers.81.mlp.experts.130.gate_proj", "model.layers.81.mlp.experts.131.gate_proj", "model.layers.81.mlp.experts.132.gate_proj", "model.layers.81.mlp.experts.133.gate_proj", "model.layers.81.mlp.experts.134.gate_proj", "model.layers.81.mlp.experts.135.gate_proj", "model.layers.81.mlp.experts.136.gate_proj", "model.layers.81.mlp.experts.137.gate_proj", "model.layers.81.mlp.experts.138.gate_proj", "model.layers.81.mlp.experts.139.gate_proj", "model.layers.81.mlp.experts.140.gate_proj", "model.layers.81.mlp.experts.141.gate_proj", "model.layers.81.mlp.experts.142.gate_proj", "model.layers.81.mlp.experts.143.gate_proj", "model.layers.81.mlp.experts.144.gate_proj", "model.layers.81.mlp.experts.145.gate_proj", "model.layers.81.mlp.experts.146.gate_proj", "model.layers.81.mlp.experts.147.gate_proj", "model.layers.81.mlp.experts.148.gate_proj", "model.layers.81.mlp.experts.149.gate_proj", "model.layers.81.mlp.experts.150.gate_proj", "model.layers.81.mlp.experts.151.gate_proj", "model.layers.81.mlp.experts.152.gate_proj", "model.layers.81.mlp.experts.153.gate_proj", "model.layers.81.mlp.experts.154.gate_proj", "model.layers.81.mlp.experts.155.gate_proj", "model.layers.81.mlp.experts.156.gate_proj", "model.layers.81.mlp.experts.157.gate_proj", "model.layers.81.mlp.experts.158.gate_proj", "model.layers.81.mlp.experts.159.gate_proj", "model.layers.81.mlp.experts.0.up_proj", "model.layers.81.mlp.experts.1.up_proj", "model.layers.81.mlp.experts.2.up_proj", "model.layers.81.mlp.experts.3.up_proj", "model.layers.81.mlp.experts.4.up_proj", "model.layers.81.mlp.experts.5.up_proj", "model.layers.81.mlp.experts.6.up_proj", "model.layers.81.mlp.experts.7.up_proj", "model.layers.81.mlp.experts.8.up_proj", "model.layers.81.mlp.experts.9.up_proj", "model.layers.81.mlp.experts.10.up_proj", "model.layers.81.mlp.experts.11.up_proj", "model.layers.81.mlp.experts.12.up_proj", "model.layers.81.mlp.experts.13.up_proj", "model.layers.81.mlp.experts.14.up_proj", "model.layers.81.mlp.experts.15.up_proj", "model.layers.81.mlp.experts.16.up_proj", "model.layers.81.mlp.experts.17.up_proj", "model.layers.81.mlp.experts.18.up_proj", "model.layers.81.mlp.experts.19.up_proj", "model.layers.81.mlp.experts.20.up_proj", "model.layers.81.mlp.experts.21.up_proj", "model.layers.81.mlp.experts.22.up_proj", "model.layers.81.mlp.experts.23.up_proj", "model.layers.81.mlp.experts.24.up_proj", "model.layers.81.mlp.experts.25.up_proj", "model.layers.81.mlp.experts.26.up_proj", "model.layers.81.mlp.experts.27.up_proj", "model.layers.81.mlp.experts.28.up_proj", "model.layers.81.mlp.experts.29.up_proj", "model.layers.81.mlp.experts.30.up_proj", "model.layers.81.mlp.experts.31.up_proj", "model.layers.81.mlp.experts.32.up_proj", "model.layers.81.mlp.experts.33.up_proj", "model.layers.81.mlp.experts.34.up_proj", "model.layers.81.mlp.experts.35.up_proj", "model.layers.81.mlp.experts.36.up_proj", "model.layers.81.mlp.experts.37.up_proj", "model.layers.81.mlp.experts.38.up_proj", "model.layers.81.mlp.experts.39.up_proj", "model.layers.81.mlp.experts.40.up_proj", "model.layers.81.mlp.experts.41.up_proj", "model.layers.81.mlp.experts.42.up_proj", "model.layers.81.mlp.experts.43.up_proj", "model.layers.81.mlp.experts.44.up_proj", "model.layers.81.mlp.experts.45.up_proj", "model.layers.81.mlp.experts.46.up_proj", "model.layers.81.mlp.experts.47.up_proj", "model.layers.81.mlp.experts.48.up_proj", "model.layers.81.mlp.experts.49.up_proj", "model.layers.81.mlp.experts.50.up_proj", "model.layers.81.mlp.experts.51.up_proj", "model.layers.81.mlp.experts.52.up_proj", "model.layers.81.mlp.experts.53.up_proj", "model.layers.81.mlp.experts.54.up_proj", "model.layers.81.mlp.experts.55.up_proj", "model.layers.81.mlp.experts.56.up_proj", "model.layers.81.mlp.experts.57.up_proj", "model.layers.81.mlp.experts.58.up_proj", "model.layers.81.mlp.experts.59.up_proj", "model.layers.81.mlp.experts.60.up_proj", "model.layers.81.mlp.experts.61.up_proj", "model.layers.81.mlp.experts.62.up_proj", "model.layers.81.mlp.experts.63.up_proj", "model.layers.81.mlp.experts.64.up_proj", "model.layers.81.mlp.experts.65.up_proj", "model.layers.81.mlp.experts.66.up_proj", "model.layers.81.mlp.experts.67.up_proj", "model.layers.81.mlp.experts.68.up_proj", "model.layers.81.mlp.experts.69.up_proj", "model.layers.81.mlp.experts.70.up_proj", "model.layers.81.mlp.experts.71.up_proj", "model.layers.81.mlp.experts.72.up_proj", "model.layers.81.mlp.experts.73.up_proj", "model.layers.81.mlp.experts.74.up_proj", "model.layers.81.mlp.experts.75.up_proj", "model.layers.81.mlp.experts.76.up_proj", "model.layers.81.mlp.experts.77.up_proj", "model.layers.81.mlp.experts.78.up_proj", "model.layers.81.mlp.experts.79.up_proj", "model.layers.81.mlp.experts.80.up_proj", "model.layers.81.mlp.experts.81.up_proj", "model.layers.81.mlp.experts.82.up_proj", "model.layers.81.mlp.experts.83.up_proj", "model.layers.81.mlp.experts.84.up_proj", "model.layers.81.mlp.experts.85.up_proj", "model.layers.81.mlp.experts.86.up_proj", "model.layers.81.mlp.experts.87.up_proj", "model.layers.81.mlp.experts.88.up_proj", "model.layers.81.mlp.experts.89.up_proj", "model.layers.81.mlp.experts.90.up_proj", "model.layers.81.mlp.experts.91.up_proj", "model.layers.81.mlp.experts.92.up_proj", "model.layers.81.mlp.experts.93.up_proj", "model.layers.81.mlp.experts.94.up_proj", "model.layers.81.mlp.experts.95.up_proj", "model.layers.81.mlp.experts.96.up_proj", "model.layers.81.mlp.experts.97.up_proj", "model.layers.81.mlp.experts.98.up_proj", "model.layers.81.mlp.experts.99.up_proj", "model.layers.81.mlp.experts.100.up_proj", "model.layers.81.mlp.experts.101.up_proj", "model.layers.81.mlp.experts.102.up_proj", "model.layers.81.mlp.experts.103.up_proj", "model.layers.81.mlp.experts.104.up_proj", "model.layers.81.mlp.experts.105.up_proj", "model.layers.81.mlp.experts.106.up_proj", "model.layers.81.mlp.experts.107.up_proj", "model.layers.81.mlp.experts.108.up_proj", "model.layers.81.mlp.experts.109.up_proj", "model.layers.81.mlp.experts.110.up_proj", "model.layers.81.mlp.experts.111.up_proj", "model.layers.81.mlp.experts.112.up_proj", "model.layers.81.mlp.experts.113.up_proj", "model.layers.81.mlp.experts.114.up_proj", "model.layers.81.mlp.experts.115.up_proj", "model.layers.81.mlp.experts.116.up_proj", "model.layers.81.mlp.experts.117.up_proj", "model.layers.81.mlp.experts.118.up_proj", "model.layers.81.mlp.experts.119.up_proj", "model.layers.81.mlp.experts.120.up_proj", "model.layers.81.mlp.experts.121.up_proj", "model.layers.81.mlp.experts.122.up_proj", "model.layers.81.mlp.experts.123.up_proj", "model.layers.81.mlp.experts.124.up_proj", "model.layers.81.mlp.experts.125.up_proj", "model.layers.81.mlp.experts.126.up_proj", "model.layers.81.mlp.experts.127.up_proj", "model.layers.81.mlp.experts.128.up_proj", "model.layers.81.mlp.experts.129.up_proj", "model.layers.81.mlp.experts.130.up_proj", "model.layers.81.mlp.experts.131.up_proj", "model.layers.81.mlp.experts.132.up_proj", "model.layers.81.mlp.experts.133.up_proj", "model.layers.81.mlp.experts.134.up_proj", "model.layers.81.mlp.experts.135.up_proj", "model.layers.81.mlp.experts.136.up_proj", "model.layers.81.mlp.experts.137.up_proj", "model.layers.81.mlp.experts.138.up_proj", "model.layers.81.mlp.experts.139.up_proj", "model.layers.81.mlp.experts.140.up_proj", "model.layers.81.mlp.experts.141.up_proj", "model.layers.81.mlp.experts.142.up_proj", "model.layers.81.mlp.experts.143.up_proj", "model.layers.81.mlp.experts.144.up_proj", "model.layers.81.mlp.experts.145.up_proj", "model.layers.81.mlp.experts.146.up_proj", "model.layers.81.mlp.experts.147.up_proj", "model.layers.81.mlp.experts.148.up_proj", "model.layers.81.mlp.experts.149.up_proj", "model.layers.81.mlp.experts.150.up_proj", "model.layers.81.mlp.experts.151.up_proj", "model.layers.81.mlp.experts.152.up_proj", "model.layers.81.mlp.experts.153.up_proj", "model.layers.81.mlp.experts.154.up_proj", "model.layers.81.mlp.experts.155.up_proj", "model.layers.81.mlp.experts.156.up_proj", "model.layers.81.mlp.experts.157.up_proj", "model.layers.81.mlp.experts.158.up_proj", "model.layers.81.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.149755351245056e-06, "dbits": 2516582400 }, { "dkld": -2.1994207054376255e-05, "dbits": 5033164800 } ] }, { "idx": 488, "layers": [ "model.layers.81.mlp.experts.0.down_proj", "model.layers.81.mlp.experts.1.down_proj", "model.layers.81.mlp.experts.2.down_proj", "model.layers.81.mlp.experts.3.down_proj", "model.layers.81.mlp.experts.4.down_proj", "model.layers.81.mlp.experts.5.down_proj", "model.layers.81.mlp.experts.6.down_proj", "model.layers.81.mlp.experts.7.down_proj", "model.layers.81.mlp.experts.8.down_proj", "model.layers.81.mlp.experts.9.down_proj", "model.layers.81.mlp.experts.10.down_proj", "model.layers.81.mlp.experts.11.down_proj", "model.layers.81.mlp.experts.12.down_proj", "model.layers.81.mlp.experts.13.down_proj", "model.layers.81.mlp.experts.14.down_proj", "model.layers.81.mlp.experts.15.down_proj", "model.layers.81.mlp.experts.16.down_proj", "model.layers.81.mlp.experts.17.down_proj", "model.layers.81.mlp.experts.18.down_proj", "model.layers.81.mlp.experts.19.down_proj", "model.layers.81.mlp.experts.20.down_proj", "model.layers.81.mlp.experts.21.down_proj", "model.layers.81.mlp.experts.22.down_proj", "model.layers.81.mlp.experts.23.down_proj", "model.layers.81.mlp.experts.24.down_proj", "model.layers.81.mlp.experts.25.down_proj", "model.layers.81.mlp.experts.26.down_proj", "model.layers.81.mlp.experts.27.down_proj", "model.layers.81.mlp.experts.28.down_proj", "model.layers.81.mlp.experts.29.down_proj", "model.layers.81.mlp.experts.30.down_proj", "model.layers.81.mlp.experts.31.down_proj", "model.layers.81.mlp.experts.32.down_proj", "model.layers.81.mlp.experts.33.down_proj", "model.layers.81.mlp.experts.34.down_proj", "model.layers.81.mlp.experts.35.down_proj", "model.layers.81.mlp.experts.36.down_proj", "model.layers.81.mlp.experts.37.down_proj", "model.layers.81.mlp.experts.38.down_proj", "model.layers.81.mlp.experts.39.down_proj", "model.layers.81.mlp.experts.40.down_proj", "model.layers.81.mlp.experts.41.down_proj", "model.layers.81.mlp.experts.42.down_proj", "model.layers.81.mlp.experts.43.down_proj", "model.layers.81.mlp.experts.44.down_proj", "model.layers.81.mlp.experts.45.down_proj", "model.layers.81.mlp.experts.46.down_proj", "model.layers.81.mlp.experts.47.down_proj", "model.layers.81.mlp.experts.48.down_proj", "model.layers.81.mlp.experts.49.down_proj", "model.layers.81.mlp.experts.50.down_proj", "model.layers.81.mlp.experts.51.down_proj", "model.layers.81.mlp.experts.52.down_proj", "model.layers.81.mlp.experts.53.down_proj", "model.layers.81.mlp.experts.54.down_proj", "model.layers.81.mlp.experts.55.down_proj", "model.layers.81.mlp.experts.56.down_proj", "model.layers.81.mlp.experts.57.down_proj", "model.layers.81.mlp.experts.58.down_proj", "model.layers.81.mlp.experts.59.down_proj", "model.layers.81.mlp.experts.60.down_proj", "model.layers.81.mlp.experts.61.down_proj", "model.layers.81.mlp.experts.62.down_proj", "model.layers.81.mlp.experts.63.down_proj", "model.layers.81.mlp.experts.64.down_proj", "model.layers.81.mlp.experts.65.down_proj", "model.layers.81.mlp.experts.66.down_proj", "model.layers.81.mlp.experts.67.down_proj", "model.layers.81.mlp.experts.68.down_proj", "model.layers.81.mlp.experts.69.down_proj", "model.layers.81.mlp.experts.70.down_proj", "model.layers.81.mlp.experts.71.down_proj", "model.layers.81.mlp.experts.72.down_proj", "model.layers.81.mlp.experts.73.down_proj", "model.layers.81.mlp.experts.74.down_proj", "model.layers.81.mlp.experts.75.down_proj", "model.layers.81.mlp.experts.76.down_proj", "model.layers.81.mlp.experts.77.down_proj", "model.layers.81.mlp.experts.78.down_proj", "model.layers.81.mlp.experts.79.down_proj", "model.layers.81.mlp.experts.80.down_proj", "model.layers.81.mlp.experts.81.down_proj", "model.layers.81.mlp.experts.82.down_proj", "model.layers.81.mlp.experts.83.down_proj", "model.layers.81.mlp.experts.84.down_proj", "model.layers.81.mlp.experts.85.down_proj", "model.layers.81.mlp.experts.86.down_proj", "model.layers.81.mlp.experts.87.down_proj", "model.layers.81.mlp.experts.88.down_proj", "model.layers.81.mlp.experts.89.down_proj", "model.layers.81.mlp.experts.90.down_proj", "model.layers.81.mlp.experts.91.down_proj", "model.layers.81.mlp.experts.92.down_proj", "model.layers.81.mlp.experts.93.down_proj", "model.layers.81.mlp.experts.94.down_proj", "model.layers.81.mlp.experts.95.down_proj", "model.layers.81.mlp.experts.96.down_proj", "model.layers.81.mlp.experts.97.down_proj", "model.layers.81.mlp.experts.98.down_proj", "model.layers.81.mlp.experts.99.down_proj", "model.layers.81.mlp.experts.100.down_proj", "model.layers.81.mlp.experts.101.down_proj", "model.layers.81.mlp.experts.102.down_proj", "model.layers.81.mlp.experts.103.down_proj", "model.layers.81.mlp.experts.104.down_proj", "model.layers.81.mlp.experts.105.down_proj", "model.layers.81.mlp.experts.106.down_proj", "model.layers.81.mlp.experts.107.down_proj", "model.layers.81.mlp.experts.108.down_proj", "model.layers.81.mlp.experts.109.down_proj", "model.layers.81.mlp.experts.110.down_proj", "model.layers.81.mlp.experts.111.down_proj", "model.layers.81.mlp.experts.112.down_proj", "model.layers.81.mlp.experts.113.down_proj", "model.layers.81.mlp.experts.114.down_proj", "model.layers.81.mlp.experts.115.down_proj", "model.layers.81.mlp.experts.116.down_proj", "model.layers.81.mlp.experts.117.down_proj", "model.layers.81.mlp.experts.118.down_proj", "model.layers.81.mlp.experts.119.down_proj", "model.layers.81.mlp.experts.120.down_proj", "model.layers.81.mlp.experts.121.down_proj", "model.layers.81.mlp.experts.122.down_proj", "model.layers.81.mlp.experts.123.down_proj", "model.layers.81.mlp.experts.124.down_proj", "model.layers.81.mlp.experts.125.down_proj", "model.layers.81.mlp.experts.126.down_proj", "model.layers.81.mlp.experts.127.down_proj", "model.layers.81.mlp.experts.128.down_proj", "model.layers.81.mlp.experts.129.down_proj", "model.layers.81.mlp.experts.130.down_proj", "model.layers.81.mlp.experts.131.down_proj", "model.layers.81.mlp.experts.132.down_proj", "model.layers.81.mlp.experts.133.down_proj", "model.layers.81.mlp.experts.134.down_proj", "model.layers.81.mlp.experts.135.down_proj", "model.layers.81.mlp.experts.136.down_proj", "model.layers.81.mlp.experts.137.down_proj", "model.layers.81.mlp.experts.138.down_proj", "model.layers.81.mlp.experts.139.down_proj", "model.layers.81.mlp.experts.140.down_proj", "model.layers.81.mlp.experts.141.down_proj", "model.layers.81.mlp.experts.142.down_proj", "model.layers.81.mlp.experts.143.down_proj", "model.layers.81.mlp.experts.144.down_proj", "model.layers.81.mlp.experts.145.down_proj", "model.layers.81.mlp.experts.146.down_proj", "model.layers.81.mlp.experts.147.down_proj", "model.layers.81.mlp.experts.148.down_proj", "model.layers.81.mlp.experts.149.down_proj", "model.layers.81.mlp.experts.150.down_proj", "model.layers.81.mlp.experts.151.down_proj", "model.layers.81.mlp.experts.152.down_proj", "model.layers.81.mlp.experts.153.down_proj", "model.layers.81.mlp.experts.154.down_proj", "model.layers.81.mlp.experts.155.down_proj", "model.layers.81.mlp.experts.156.down_proj", "model.layers.81.mlp.experts.157.down_proj", "model.layers.81.mlp.experts.158.down_proj", "model.layers.81.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.2659886851906083e-05, "dbits": 1258291200 }, { "dkld": -1.1879554949700138e-05, "dbits": 2516582400 } ] }, { "idx": 489, "layers": [ "model.layers.82.self_attn.q_proj" ], "candidates": [ { "dkld": -1.7458549700677048e-05, "dbits": 62914560 }, { "dkld": -1.7895735800264878e-05, "dbits": 125829120 } ] }, { "idx": 490, "layers": [ "model.layers.82.self_attn.k_proj", "model.layers.82.self_attn.v_proj" ], "candidates": [ { "dkld": -9.354173671454087e-05, "dbits": 10485760 }, { "dkld": -7.775467820465495e-05, "dbits": 20971520 } ] }, { "idx": 491, "layers": [ "model.layers.82.self_attn.o_proj" ], "candidates": [ { "dkld": -6.817937828600303e-05, "dbits": 62914560 }, { "dkld": -6.763380952179432e-05, "dbits": 125829120 } ] }, { "idx": 492, "layers": [ "model.layers.82.mlp.shared_experts.gate_proj", "model.layers.82.mlp.shared_experts.up_proj", "model.layers.82.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 2.5461358018220165e-05, "dbits": 23592960 }, { "dkld": -2.2982992231844815e-05, "dbits": 47185920 } ] }, { "idx": 493, "layers": [ "model.layers.82.mlp.experts.0.gate_proj", "model.layers.82.mlp.experts.1.gate_proj", "model.layers.82.mlp.experts.2.gate_proj", "model.layers.82.mlp.experts.3.gate_proj", "model.layers.82.mlp.experts.4.gate_proj", "model.layers.82.mlp.experts.5.gate_proj", "model.layers.82.mlp.experts.6.gate_proj", "model.layers.82.mlp.experts.7.gate_proj", "model.layers.82.mlp.experts.8.gate_proj", "model.layers.82.mlp.experts.9.gate_proj", "model.layers.82.mlp.experts.10.gate_proj", "model.layers.82.mlp.experts.11.gate_proj", "model.layers.82.mlp.experts.12.gate_proj", "model.layers.82.mlp.experts.13.gate_proj", "model.layers.82.mlp.experts.14.gate_proj", "model.layers.82.mlp.experts.15.gate_proj", "model.layers.82.mlp.experts.16.gate_proj", "model.layers.82.mlp.experts.17.gate_proj", "model.layers.82.mlp.experts.18.gate_proj", "model.layers.82.mlp.experts.19.gate_proj", "model.layers.82.mlp.experts.20.gate_proj", "model.layers.82.mlp.experts.21.gate_proj", "model.layers.82.mlp.experts.22.gate_proj", "model.layers.82.mlp.experts.23.gate_proj", "model.layers.82.mlp.experts.24.gate_proj", "model.layers.82.mlp.experts.25.gate_proj", "model.layers.82.mlp.experts.26.gate_proj", "model.layers.82.mlp.experts.27.gate_proj", "model.layers.82.mlp.experts.28.gate_proj", "model.layers.82.mlp.experts.29.gate_proj", "model.layers.82.mlp.experts.30.gate_proj", "model.layers.82.mlp.experts.31.gate_proj", "model.layers.82.mlp.experts.32.gate_proj", "model.layers.82.mlp.experts.33.gate_proj", "model.layers.82.mlp.experts.34.gate_proj", "model.layers.82.mlp.experts.35.gate_proj", "model.layers.82.mlp.experts.36.gate_proj", "model.layers.82.mlp.experts.37.gate_proj", "model.layers.82.mlp.experts.38.gate_proj", "model.layers.82.mlp.experts.39.gate_proj", "model.layers.82.mlp.experts.40.gate_proj", "model.layers.82.mlp.experts.41.gate_proj", "model.layers.82.mlp.experts.42.gate_proj", "model.layers.82.mlp.experts.43.gate_proj", "model.layers.82.mlp.experts.44.gate_proj", "model.layers.82.mlp.experts.45.gate_proj", "model.layers.82.mlp.experts.46.gate_proj", "model.layers.82.mlp.experts.47.gate_proj", "model.layers.82.mlp.experts.48.gate_proj", "model.layers.82.mlp.experts.49.gate_proj", "model.layers.82.mlp.experts.50.gate_proj", "model.layers.82.mlp.experts.51.gate_proj", "model.layers.82.mlp.experts.52.gate_proj", "model.layers.82.mlp.experts.53.gate_proj", "model.layers.82.mlp.experts.54.gate_proj", "model.layers.82.mlp.experts.55.gate_proj", "model.layers.82.mlp.experts.56.gate_proj", "model.layers.82.mlp.experts.57.gate_proj", "model.layers.82.mlp.experts.58.gate_proj", "model.layers.82.mlp.experts.59.gate_proj", "model.layers.82.mlp.experts.60.gate_proj", "model.layers.82.mlp.experts.61.gate_proj", "model.layers.82.mlp.experts.62.gate_proj", "model.layers.82.mlp.experts.63.gate_proj", "model.layers.82.mlp.experts.64.gate_proj", "model.layers.82.mlp.experts.65.gate_proj", "model.layers.82.mlp.experts.66.gate_proj", "model.layers.82.mlp.experts.67.gate_proj", "model.layers.82.mlp.experts.68.gate_proj", "model.layers.82.mlp.experts.69.gate_proj", "model.layers.82.mlp.experts.70.gate_proj", "model.layers.82.mlp.experts.71.gate_proj", "model.layers.82.mlp.experts.72.gate_proj", "model.layers.82.mlp.experts.73.gate_proj", "model.layers.82.mlp.experts.74.gate_proj", "model.layers.82.mlp.experts.75.gate_proj", "model.layers.82.mlp.experts.76.gate_proj", "model.layers.82.mlp.experts.77.gate_proj", "model.layers.82.mlp.experts.78.gate_proj", "model.layers.82.mlp.experts.79.gate_proj", "model.layers.82.mlp.experts.80.gate_proj", "model.layers.82.mlp.experts.81.gate_proj", "model.layers.82.mlp.experts.82.gate_proj", "model.layers.82.mlp.experts.83.gate_proj", "model.layers.82.mlp.experts.84.gate_proj", "model.layers.82.mlp.experts.85.gate_proj", "model.layers.82.mlp.experts.86.gate_proj", "model.layers.82.mlp.experts.87.gate_proj", "model.layers.82.mlp.experts.88.gate_proj", "model.layers.82.mlp.experts.89.gate_proj", "model.layers.82.mlp.experts.90.gate_proj", "model.layers.82.mlp.experts.91.gate_proj", "model.layers.82.mlp.experts.92.gate_proj", "model.layers.82.mlp.experts.93.gate_proj", "model.layers.82.mlp.experts.94.gate_proj", "model.layers.82.mlp.experts.95.gate_proj", "model.layers.82.mlp.experts.96.gate_proj", "model.layers.82.mlp.experts.97.gate_proj", "model.layers.82.mlp.experts.98.gate_proj", "model.layers.82.mlp.experts.99.gate_proj", "model.layers.82.mlp.experts.100.gate_proj", "model.layers.82.mlp.experts.101.gate_proj", "model.layers.82.mlp.experts.102.gate_proj", "model.layers.82.mlp.experts.103.gate_proj", "model.layers.82.mlp.experts.104.gate_proj", "model.layers.82.mlp.experts.105.gate_proj", "model.layers.82.mlp.experts.106.gate_proj", "model.layers.82.mlp.experts.107.gate_proj", "model.layers.82.mlp.experts.108.gate_proj", "model.layers.82.mlp.experts.109.gate_proj", "model.layers.82.mlp.experts.110.gate_proj", "model.layers.82.mlp.experts.111.gate_proj", "model.layers.82.mlp.experts.112.gate_proj", "model.layers.82.mlp.experts.113.gate_proj", "model.layers.82.mlp.experts.114.gate_proj", "model.layers.82.mlp.experts.115.gate_proj", "model.layers.82.mlp.experts.116.gate_proj", "model.layers.82.mlp.experts.117.gate_proj", "model.layers.82.mlp.experts.118.gate_proj", "model.layers.82.mlp.experts.119.gate_proj", "model.layers.82.mlp.experts.120.gate_proj", "model.layers.82.mlp.experts.121.gate_proj", "model.layers.82.mlp.experts.122.gate_proj", "model.layers.82.mlp.experts.123.gate_proj", "model.layers.82.mlp.experts.124.gate_proj", "model.layers.82.mlp.experts.125.gate_proj", "model.layers.82.mlp.experts.126.gate_proj", "model.layers.82.mlp.experts.127.gate_proj", "model.layers.82.mlp.experts.128.gate_proj", "model.layers.82.mlp.experts.129.gate_proj", "model.layers.82.mlp.experts.130.gate_proj", "model.layers.82.mlp.experts.131.gate_proj", "model.layers.82.mlp.experts.132.gate_proj", "model.layers.82.mlp.experts.133.gate_proj", "model.layers.82.mlp.experts.134.gate_proj", "model.layers.82.mlp.experts.135.gate_proj", "model.layers.82.mlp.experts.136.gate_proj", "model.layers.82.mlp.experts.137.gate_proj", "model.layers.82.mlp.experts.138.gate_proj", "model.layers.82.mlp.experts.139.gate_proj", "model.layers.82.mlp.experts.140.gate_proj", "model.layers.82.mlp.experts.141.gate_proj", "model.layers.82.mlp.experts.142.gate_proj", "model.layers.82.mlp.experts.143.gate_proj", "model.layers.82.mlp.experts.144.gate_proj", "model.layers.82.mlp.experts.145.gate_proj", "model.layers.82.mlp.experts.146.gate_proj", "model.layers.82.mlp.experts.147.gate_proj", "model.layers.82.mlp.experts.148.gate_proj", "model.layers.82.mlp.experts.149.gate_proj", "model.layers.82.mlp.experts.150.gate_proj", "model.layers.82.mlp.experts.151.gate_proj", "model.layers.82.mlp.experts.152.gate_proj", "model.layers.82.mlp.experts.153.gate_proj", "model.layers.82.mlp.experts.154.gate_proj", "model.layers.82.mlp.experts.155.gate_proj", "model.layers.82.mlp.experts.156.gate_proj", "model.layers.82.mlp.experts.157.gate_proj", "model.layers.82.mlp.experts.158.gate_proj", "model.layers.82.mlp.experts.159.gate_proj", "model.layers.82.mlp.experts.0.up_proj", "model.layers.82.mlp.experts.1.up_proj", "model.layers.82.mlp.experts.2.up_proj", "model.layers.82.mlp.experts.3.up_proj", "model.layers.82.mlp.experts.4.up_proj", "model.layers.82.mlp.experts.5.up_proj", "model.layers.82.mlp.experts.6.up_proj", "model.layers.82.mlp.experts.7.up_proj", "model.layers.82.mlp.experts.8.up_proj", "model.layers.82.mlp.experts.9.up_proj", "model.layers.82.mlp.experts.10.up_proj", "model.layers.82.mlp.experts.11.up_proj", "model.layers.82.mlp.experts.12.up_proj", "model.layers.82.mlp.experts.13.up_proj", "model.layers.82.mlp.experts.14.up_proj", "model.layers.82.mlp.experts.15.up_proj", "model.layers.82.mlp.experts.16.up_proj", "model.layers.82.mlp.experts.17.up_proj", "model.layers.82.mlp.experts.18.up_proj", "model.layers.82.mlp.experts.19.up_proj", "model.layers.82.mlp.experts.20.up_proj", "model.layers.82.mlp.experts.21.up_proj", "model.layers.82.mlp.experts.22.up_proj", "model.layers.82.mlp.experts.23.up_proj", "model.layers.82.mlp.experts.24.up_proj", "model.layers.82.mlp.experts.25.up_proj", "model.layers.82.mlp.experts.26.up_proj", "model.layers.82.mlp.experts.27.up_proj", "model.layers.82.mlp.experts.28.up_proj", "model.layers.82.mlp.experts.29.up_proj", "model.layers.82.mlp.experts.30.up_proj", "model.layers.82.mlp.experts.31.up_proj", "model.layers.82.mlp.experts.32.up_proj", "model.layers.82.mlp.experts.33.up_proj", "model.layers.82.mlp.experts.34.up_proj", "model.layers.82.mlp.experts.35.up_proj", "model.layers.82.mlp.experts.36.up_proj", "model.layers.82.mlp.experts.37.up_proj", "model.layers.82.mlp.experts.38.up_proj", "model.layers.82.mlp.experts.39.up_proj", "model.layers.82.mlp.experts.40.up_proj", "model.layers.82.mlp.experts.41.up_proj", "model.layers.82.mlp.experts.42.up_proj", "model.layers.82.mlp.experts.43.up_proj", "model.layers.82.mlp.experts.44.up_proj", "model.layers.82.mlp.experts.45.up_proj", "model.layers.82.mlp.experts.46.up_proj", "model.layers.82.mlp.experts.47.up_proj", "model.layers.82.mlp.experts.48.up_proj", "model.layers.82.mlp.experts.49.up_proj", "model.layers.82.mlp.experts.50.up_proj", "model.layers.82.mlp.experts.51.up_proj", "model.layers.82.mlp.experts.52.up_proj", "model.layers.82.mlp.experts.53.up_proj", "model.layers.82.mlp.experts.54.up_proj", "model.layers.82.mlp.experts.55.up_proj", "model.layers.82.mlp.experts.56.up_proj", "model.layers.82.mlp.experts.57.up_proj", "model.layers.82.mlp.experts.58.up_proj", "model.layers.82.mlp.experts.59.up_proj", "model.layers.82.mlp.experts.60.up_proj", "model.layers.82.mlp.experts.61.up_proj", "model.layers.82.mlp.experts.62.up_proj", "model.layers.82.mlp.experts.63.up_proj", "model.layers.82.mlp.experts.64.up_proj", "model.layers.82.mlp.experts.65.up_proj", "model.layers.82.mlp.experts.66.up_proj", "model.layers.82.mlp.experts.67.up_proj", "model.layers.82.mlp.experts.68.up_proj", "model.layers.82.mlp.experts.69.up_proj", "model.layers.82.mlp.experts.70.up_proj", "model.layers.82.mlp.experts.71.up_proj", "model.layers.82.mlp.experts.72.up_proj", "model.layers.82.mlp.experts.73.up_proj", "model.layers.82.mlp.experts.74.up_proj", "model.layers.82.mlp.experts.75.up_proj", "model.layers.82.mlp.experts.76.up_proj", "model.layers.82.mlp.experts.77.up_proj", "model.layers.82.mlp.experts.78.up_proj", "model.layers.82.mlp.experts.79.up_proj", "model.layers.82.mlp.experts.80.up_proj", "model.layers.82.mlp.experts.81.up_proj", "model.layers.82.mlp.experts.82.up_proj", "model.layers.82.mlp.experts.83.up_proj", "model.layers.82.mlp.experts.84.up_proj", "model.layers.82.mlp.experts.85.up_proj", "model.layers.82.mlp.experts.86.up_proj", "model.layers.82.mlp.experts.87.up_proj", "model.layers.82.mlp.experts.88.up_proj", "model.layers.82.mlp.experts.89.up_proj", "model.layers.82.mlp.experts.90.up_proj", "model.layers.82.mlp.experts.91.up_proj", "model.layers.82.mlp.experts.92.up_proj", "model.layers.82.mlp.experts.93.up_proj", "model.layers.82.mlp.experts.94.up_proj", "model.layers.82.mlp.experts.95.up_proj", "model.layers.82.mlp.experts.96.up_proj", "model.layers.82.mlp.experts.97.up_proj", "model.layers.82.mlp.experts.98.up_proj", "model.layers.82.mlp.experts.99.up_proj", "model.layers.82.mlp.experts.100.up_proj", "model.layers.82.mlp.experts.101.up_proj", "model.layers.82.mlp.experts.102.up_proj", "model.layers.82.mlp.experts.103.up_proj", "model.layers.82.mlp.experts.104.up_proj", "model.layers.82.mlp.experts.105.up_proj", "model.layers.82.mlp.experts.106.up_proj", "model.layers.82.mlp.experts.107.up_proj", "model.layers.82.mlp.experts.108.up_proj", "model.layers.82.mlp.experts.109.up_proj", "model.layers.82.mlp.experts.110.up_proj", "model.layers.82.mlp.experts.111.up_proj", "model.layers.82.mlp.experts.112.up_proj", "model.layers.82.mlp.experts.113.up_proj", "model.layers.82.mlp.experts.114.up_proj", "model.layers.82.mlp.experts.115.up_proj", "model.layers.82.mlp.experts.116.up_proj", "model.layers.82.mlp.experts.117.up_proj", "model.layers.82.mlp.experts.118.up_proj", "model.layers.82.mlp.experts.119.up_proj", "model.layers.82.mlp.experts.120.up_proj", "model.layers.82.mlp.experts.121.up_proj", "model.layers.82.mlp.experts.122.up_proj", "model.layers.82.mlp.experts.123.up_proj", "model.layers.82.mlp.experts.124.up_proj", "model.layers.82.mlp.experts.125.up_proj", "model.layers.82.mlp.experts.126.up_proj", "model.layers.82.mlp.experts.127.up_proj", "model.layers.82.mlp.experts.128.up_proj", "model.layers.82.mlp.experts.129.up_proj", "model.layers.82.mlp.experts.130.up_proj", "model.layers.82.mlp.experts.131.up_proj", "model.layers.82.mlp.experts.132.up_proj", "model.layers.82.mlp.experts.133.up_proj", "model.layers.82.mlp.experts.134.up_proj", "model.layers.82.mlp.experts.135.up_proj", "model.layers.82.mlp.experts.136.up_proj", "model.layers.82.mlp.experts.137.up_proj", "model.layers.82.mlp.experts.138.up_proj", "model.layers.82.mlp.experts.139.up_proj", "model.layers.82.mlp.experts.140.up_proj", "model.layers.82.mlp.experts.141.up_proj", "model.layers.82.mlp.experts.142.up_proj", "model.layers.82.mlp.experts.143.up_proj", "model.layers.82.mlp.experts.144.up_proj", "model.layers.82.mlp.experts.145.up_proj", "model.layers.82.mlp.experts.146.up_proj", "model.layers.82.mlp.experts.147.up_proj", "model.layers.82.mlp.experts.148.up_proj", "model.layers.82.mlp.experts.149.up_proj", "model.layers.82.mlp.experts.150.up_proj", "model.layers.82.mlp.experts.151.up_proj", "model.layers.82.mlp.experts.152.up_proj", "model.layers.82.mlp.experts.153.up_proj", "model.layers.82.mlp.experts.154.up_proj", "model.layers.82.mlp.experts.155.up_proj", "model.layers.82.mlp.experts.156.up_proj", "model.layers.82.mlp.experts.157.up_proj", "model.layers.82.mlp.experts.158.up_proj", "model.layers.82.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.716576516628404e-05, "dbits": 2516582400 }, { "dkld": 1.3368786312639713e-05, "dbits": 5033164800 } ] }, { "idx": 494, "layers": [ "model.layers.82.mlp.experts.0.down_proj", "model.layers.82.mlp.experts.1.down_proj", "model.layers.82.mlp.experts.2.down_proj", "model.layers.82.mlp.experts.3.down_proj", "model.layers.82.mlp.experts.4.down_proj", "model.layers.82.mlp.experts.5.down_proj", "model.layers.82.mlp.experts.6.down_proj", "model.layers.82.mlp.experts.7.down_proj", "model.layers.82.mlp.experts.8.down_proj", "model.layers.82.mlp.experts.9.down_proj", "model.layers.82.mlp.experts.10.down_proj", "model.layers.82.mlp.experts.11.down_proj", "model.layers.82.mlp.experts.12.down_proj", "model.layers.82.mlp.experts.13.down_proj", "model.layers.82.mlp.experts.14.down_proj", "model.layers.82.mlp.experts.15.down_proj", "model.layers.82.mlp.experts.16.down_proj", "model.layers.82.mlp.experts.17.down_proj", "model.layers.82.mlp.experts.18.down_proj", "model.layers.82.mlp.experts.19.down_proj", "model.layers.82.mlp.experts.20.down_proj", "model.layers.82.mlp.experts.21.down_proj", "model.layers.82.mlp.experts.22.down_proj", "model.layers.82.mlp.experts.23.down_proj", "model.layers.82.mlp.experts.24.down_proj", "model.layers.82.mlp.experts.25.down_proj", "model.layers.82.mlp.experts.26.down_proj", "model.layers.82.mlp.experts.27.down_proj", "model.layers.82.mlp.experts.28.down_proj", "model.layers.82.mlp.experts.29.down_proj", "model.layers.82.mlp.experts.30.down_proj", "model.layers.82.mlp.experts.31.down_proj", "model.layers.82.mlp.experts.32.down_proj", "model.layers.82.mlp.experts.33.down_proj", "model.layers.82.mlp.experts.34.down_proj", "model.layers.82.mlp.experts.35.down_proj", "model.layers.82.mlp.experts.36.down_proj", "model.layers.82.mlp.experts.37.down_proj", "model.layers.82.mlp.experts.38.down_proj", "model.layers.82.mlp.experts.39.down_proj", "model.layers.82.mlp.experts.40.down_proj", "model.layers.82.mlp.experts.41.down_proj", "model.layers.82.mlp.experts.42.down_proj", "model.layers.82.mlp.experts.43.down_proj", "model.layers.82.mlp.experts.44.down_proj", "model.layers.82.mlp.experts.45.down_proj", "model.layers.82.mlp.experts.46.down_proj", "model.layers.82.mlp.experts.47.down_proj", "model.layers.82.mlp.experts.48.down_proj", "model.layers.82.mlp.experts.49.down_proj", "model.layers.82.mlp.experts.50.down_proj", "model.layers.82.mlp.experts.51.down_proj", "model.layers.82.mlp.experts.52.down_proj", "model.layers.82.mlp.experts.53.down_proj", "model.layers.82.mlp.experts.54.down_proj", "model.layers.82.mlp.experts.55.down_proj", "model.layers.82.mlp.experts.56.down_proj", "model.layers.82.mlp.experts.57.down_proj", "model.layers.82.mlp.experts.58.down_proj", "model.layers.82.mlp.experts.59.down_proj", "model.layers.82.mlp.experts.60.down_proj", "model.layers.82.mlp.experts.61.down_proj", "model.layers.82.mlp.experts.62.down_proj", "model.layers.82.mlp.experts.63.down_proj", "model.layers.82.mlp.experts.64.down_proj", "model.layers.82.mlp.experts.65.down_proj", "model.layers.82.mlp.experts.66.down_proj", "model.layers.82.mlp.experts.67.down_proj", "model.layers.82.mlp.experts.68.down_proj", "model.layers.82.mlp.experts.69.down_proj", "model.layers.82.mlp.experts.70.down_proj", "model.layers.82.mlp.experts.71.down_proj", "model.layers.82.mlp.experts.72.down_proj", "model.layers.82.mlp.experts.73.down_proj", "model.layers.82.mlp.experts.74.down_proj", "model.layers.82.mlp.experts.75.down_proj", "model.layers.82.mlp.experts.76.down_proj", "model.layers.82.mlp.experts.77.down_proj", "model.layers.82.mlp.experts.78.down_proj", "model.layers.82.mlp.experts.79.down_proj", "model.layers.82.mlp.experts.80.down_proj", "model.layers.82.mlp.experts.81.down_proj", "model.layers.82.mlp.experts.82.down_proj", "model.layers.82.mlp.experts.83.down_proj", "model.layers.82.mlp.experts.84.down_proj", "model.layers.82.mlp.experts.85.down_proj", "model.layers.82.mlp.experts.86.down_proj", "model.layers.82.mlp.experts.87.down_proj", "model.layers.82.mlp.experts.88.down_proj", "model.layers.82.mlp.experts.89.down_proj", "model.layers.82.mlp.experts.90.down_proj", "model.layers.82.mlp.experts.91.down_proj", "model.layers.82.mlp.experts.92.down_proj", "model.layers.82.mlp.experts.93.down_proj", "model.layers.82.mlp.experts.94.down_proj", "model.layers.82.mlp.experts.95.down_proj", "model.layers.82.mlp.experts.96.down_proj", "model.layers.82.mlp.experts.97.down_proj", "model.layers.82.mlp.experts.98.down_proj", "model.layers.82.mlp.experts.99.down_proj", "model.layers.82.mlp.experts.100.down_proj", "model.layers.82.mlp.experts.101.down_proj", "model.layers.82.mlp.experts.102.down_proj", "model.layers.82.mlp.experts.103.down_proj", "model.layers.82.mlp.experts.104.down_proj", "model.layers.82.mlp.experts.105.down_proj", "model.layers.82.mlp.experts.106.down_proj", "model.layers.82.mlp.experts.107.down_proj", "model.layers.82.mlp.experts.108.down_proj", "model.layers.82.mlp.experts.109.down_proj", "model.layers.82.mlp.experts.110.down_proj", "model.layers.82.mlp.experts.111.down_proj", "model.layers.82.mlp.experts.112.down_proj", "model.layers.82.mlp.experts.113.down_proj", "model.layers.82.mlp.experts.114.down_proj", "model.layers.82.mlp.experts.115.down_proj", "model.layers.82.mlp.experts.116.down_proj", "model.layers.82.mlp.experts.117.down_proj", "model.layers.82.mlp.experts.118.down_proj", "model.layers.82.mlp.experts.119.down_proj", "model.layers.82.mlp.experts.120.down_proj", "model.layers.82.mlp.experts.121.down_proj", "model.layers.82.mlp.experts.122.down_proj", "model.layers.82.mlp.experts.123.down_proj", "model.layers.82.mlp.experts.124.down_proj", "model.layers.82.mlp.experts.125.down_proj", "model.layers.82.mlp.experts.126.down_proj", "model.layers.82.mlp.experts.127.down_proj", "model.layers.82.mlp.experts.128.down_proj", "model.layers.82.mlp.experts.129.down_proj", "model.layers.82.mlp.experts.130.down_proj", "model.layers.82.mlp.experts.131.down_proj", "model.layers.82.mlp.experts.132.down_proj", "model.layers.82.mlp.experts.133.down_proj", "model.layers.82.mlp.experts.134.down_proj", "model.layers.82.mlp.experts.135.down_proj", "model.layers.82.mlp.experts.136.down_proj", "model.layers.82.mlp.experts.137.down_proj", "model.layers.82.mlp.experts.138.down_proj", "model.layers.82.mlp.experts.139.down_proj", "model.layers.82.mlp.experts.140.down_proj", "model.layers.82.mlp.experts.141.down_proj", "model.layers.82.mlp.experts.142.down_proj", "model.layers.82.mlp.experts.143.down_proj", "model.layers.82.mlp.experts.144.down_proj", "model.layers.82.mlp.experts.145.down_proj", "model.layers.82.mlp.experts.146.down_proj", "model.layers.82.mlp.experts.147.down_proj", "model.layers.82.mlp.experts.148.down_proj", "model.layers.82.mlp.experts.149.down_proj", "model.layers.82.mlp.experts.150.down_proj", "model.layers.82.mlp.experts.151.down_proj", "model.layers.82.mlp.experts.152.down_proj", "model.layers.82.mlp.experts.153.down_proj", "model.layers.82.mlp.experts.154.down_proj", "model.layers.82.mlp.experts.155.down_proj", "model.layers.82.mlp.experts.156.down_proj", "model.layers.82.mlp.experts.157.down_proj", "model.layers.82.mlp.experts.158.down_proj", "model.layers.82.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 8.841790258885124e-06, "dbits": 1258291200 }, { "dkld": 6.555253639817585e-06, "dbits": 2516582400 } ] }, { "idx": 495, "layers": [ "model.layers.83.self_attn.q_proj" ], "candidates": [ { "dkld": 1.0487553663552501e-05, "dbits": 62914560 }, { "dkld": -3.673881292342099e-06, "dbits": 125829120 } ] }, { "idx": 496, "layers": [ "model.layers.83.self_attn.k_proj", "model.layers.83.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00013102882076054811, "dbits": 10485760 }, { "dkld": -0.00013577742502093176, "dbits": 20971520 } ] }, { "idx": 497, "layers": [ "model.layers.83.self_attn.o_proj" ], "candidates": [ { "dkld": -4.825063515454496e-05, "dbits": 62914560 }, { "dkld": -2.646739594638209e-05, "dbits": 125829120 } ] }, { "idx": 498, "layers": [ "model.layers.83.mlp.shared_experts.gate_proj", "model.layers.83.mlp.shared_experts.up_proj", "model.layers.83.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -2.5606807321309696e-05, "dbits": 23592960 }, { "dkld": -4.200199618935481e-05, "dbits": 47185920 } ] }, { "idx": 499, "layers": [ "model.layers.83.mlp.experts.0.gate_proj", "model.layers.83.mlp.experts.1.gate_proj", "model.layers.83.mlp.experts.2.gate_proj", "model.layers.83.mlp.experts.3.gate_proj", "model.layers.83.mlp.experts.4.gate_proj", "model.layers.83.mlp.experts.5.gate_proj", "model.layers.83.mlp.experts.6.gate_proj", "model.layers.83.mlp.experts.7.gate_proj", "model.layers.83.mlp.experts.8.gate_proj", "model.layers.83.mlp.experts.9.gate_proj", "model.layers.83.mlp.experts.10.gate_proj", "model.layers.83.mlp.experts.11.gate_proj", "model.layers.83.mlp.experts.12.gate_proj", "model.layers.83.mlp.experts.13.gate_proj", "model.layers.83.mlp.experts.14.gate_proj", "model.layers.83.mlp.experts.15.gate_proj", "model.layers.83.mlp.experts.16.gate_proj", "model.layers.83.mlp.experts.17.gate_proj", "model.layers.83.mlp.experts.18.gate_proj", "model.layers.83.mlp.experts.19.gate_proj", "model.layers.83.mlp.experts.20.gate_proj", "model.layers.83.mlp.experts.21.gate_proj", "model.layers.83.mlp.experts.22.gate_proj", "model.layers.83.mlp.experts.23.gate_proj", "model.layers.83.mlp.experts.24.gate_proj", "model.layers.83.mlp.experts.25.gate_proj", "model.layers.83.mlp.experts.26.gate_proj", "model.layers.83.mlp.experts.27.gate_proj", "model.layers.83.mlp.experts.28.gate_proj", "model.layers.83.mlp.experts.29.gate_proj", "model.layers.83.mlp.experts.30.gate_proj", "model.layers.83.mlp.experts.31.gate_proj", "model.layers.83.mlp.experts.32.gate_proj", "model.layers.83.mlp.experts.33.gate_proj", "model.layers.83.mlp.experts.34.gate_proj", "model.layers.83.mlp.experts.35.gate_proj", "model.layers.83.mlp.experts.36.gate_proj", "model.layers.83.mlp.experts.37.gate_proj", "model.layers.83.mlp.experts.38.gate_proj", "model.layers.83.mlp.experts.39.gate_proj", "model.layers.83.mlp.experts.40.gate_proj", "model.layers.83.mlp.experts.41.gate_proj", "model.layers.83.mlp.experts.42.gate_proj", "model.layers.83.mlp.experts.43.gate_proj", "model.layers.83.mlp.experts.44.gate_proj", "model.layers.83.mlp.experts.45.gate_proj", "model.layers.83.mlp.experts.46.gate_proj", "model.layers.83.mlp.experts.47.gate_proj", "model.layers.83.mlp.experts.48.gate_proj", "model.layers.83.mlp.experts.49.gate_proj", "model.layers.83.mlp.experts.50.gate_proj", "model.layers.83.mlp.experts.51.gate_proj", "model.layers.83.mlp.experts.52.gate_proj", "model.layers.83.mlp.experts.53.gate_proj", "model.layers.83.mlp.experts.54.gate_proj", "model.layers.83.mlp.experts.55.gate_proj", "model.layers.83.mlp.experts.56.gate_proj", "model.layers.83.mlp.experts.57.gate_proj", "model.layers.83.mlp.experts.58.gate_proj", "model.layers.83.mlp.experts.59.gate_proj", "model.layers.83.mlp.experts.60.gate_proj", "model.layers.83.mlp.experts.61.gate_proj", "model.layers.83.mlp.experts.62.gate_proj", "model.layers.83.mlp.experts.63.gate_proj", "model.layers.83.mlp.experts.64.gate_proj", "model.layers.83.mlp.experts.65.gate_proj", "model.layers.83.mlp.experts.66.gate_proj", "model.layers.83.mlp.experts.67.gate_proj", "model.layers.83.mlp.experts.68.gate_proj", "model.layers.83.mlp.experts.69.gate_proj", "model.layers.83.mlp.experts.70.gate_proj", "model.layers.83.mlp.experts.71.gate_proj", "model.layers.83.mlp.experts.72.gate_proj", "model.layers.83.mlp.experts.73.gate_proj", "model.layers.83.mlp.experts.74.gate_proj", "model.layers.83.mlp.experts.75.gate_proj", "model.layers.83.mlp.experts.76.gate_proj", "model.layers.83.mlp.experts.77.gate_proj", "model.layers.83.mlp.experts.78.gate_proj", "model.layers.83.mlp.experts.79.gate_proj", "model.layers.83.mlp.experts.80.gate_proj", "model.layers.83.mlp.experts.81.gate_proj", "model.layers.83.mlp.experts.82.gate_proj", "model.layers.83.mlp.experts.83.gate_proj", "model.layers.83.mlp.experts.84.gate_proj", "model.layers.83.mlp.experts.85.gate_proj", "model.layers.83.mlp.experts.86.gate_proj", "model.layers.83.mlp.experts.87.gate_proj", "model.layers.83.mlp.experts.88.gate_proj", "model.layers.83.mlp.experts.89.gate_proj", "model.layers.83.mlp.experts.90.gate_proj", "model.layers.83.mlp.experts.91.gate_proj", "model.layers.83.mlp.experts.92.gate_proj", "model.layers.83.mlp.experts.93.gate_proj", "model.layers.83.mlp.experts.94.gate_proj", "model.layers.83.mlp.experts.95.gate_proj", "model.layers.83.mlp.experts.96.gate_proj", "model.layers.83.mlp.experts.97.gate_proj", "model.layers.83.mlp.experts.98.gate_proj", "model.layers.83.mlp.experts.99.gate_proj", "model.layers.83.mlp.experts.100.gate_proj", "model.layers.83.mlp.experts.101.gate_proj", "model.layers.83.mlp.experts.102.gate_proj", "model.layers.83.mlp.experts.103.gate_proj", "model.layers.83.mlp.experts.104.gate_proj", "model.layers.83.mlp.experts.105.gate_proj", "model.layers.83.mlp.experts.106.gate_proj", "model.layers.83.mlp.experts.107.gate_proj", "model.layers.83.mlp.experts.108.gate_proj", "model.layers.83.mlp.experts.109.gate_proj", "model.layers.83.mlp.experts.110.gate_proj", "model.layers.83.mlp.experts.111.gate_proj", "model.layers.83.mlp.experts.112.gate_proj", "model.layers.83.mlp.experts.113.gate_proj", "model.layers.83.mlp.experts.114.gate_proj", "model.layers.83.mlp.experts.115.gate_proj", "model.layers.83.mlp.experts.116.gate_proj", "model.layers.83.mlp.experts.117.gate_proj", "model.layers.83.mlp.experts.118.gate_proj", "model.layers.83.mlp.experts.119.gate_proj", "model.layers.83.mlp.experts.120.gate_proj", "model.layers.83.mlp.experts.121.gate_proj", "model.layers.83.mlp.experts.122.gate_proj", "model.layers.83.mlp.experts.123.gate_proj", "model.layers.83.mlp.experts.124.gate_proj", "model.layers.83.mlp.experts.125.gate_proj", "model.layers.83.mlp.experts.126.gate_proj", "model.layers.83.mlp.experts.127.gate_proj", "model.layers.83.mlp.experts.128.gate_proj", "model.layers.83.mlp.experts.129.gate_proj", "model.layers.83.mlp.experts.130.gate_proj", "model.layers.83.mlp.experts.131.gate_proj", "model.layers.83.mlp.experts.132.gate_proj", "model.layers.83.mlp.experts.133.gate_proj", "model.layers.83.mlp.experts.134.gate_proj", "model.layers.83.mlp.experts.135.gate_proj", "model.layers.83.mlp.experts.136.gate_proj", "model.layers.83.mlp.experts.137.gate_proj", "model.layers.83.mlp.experts.138.gate_proj", "model.layers.83.mlp.experts.139.gate_proj", "model.layers.83.mlp.experts.140.gate_proj", "model.layers.83.mlp.experts.141.gate_proj", "model.layers.83.mlp.experts.142.gate_proj", "model.layers.83.mlp.experts.143.gate_proj", "model.layers.83.mlp.experts.144.gate_proj", "model.layers.83.mlp.experts.145.gate_proj", "model.layers.83.mlp.experts.146.gate_proj", "model.layers.83.mlp.experts.147.gate_proj", "model.layers.83.mlp.experts.148.gate_proj", "model.layers.83.mlp.experts.149.gate_proj", "model.layers.83.mlp.experts.150.gate_proj", "model.layers.83.mlp.experts.151.gate_proj", "model.layers.83.mlp.experts.152.gate_proj", "model.layers.83.mlp.experts.153.gate_proj", "model.layers.83.mlp.experts.154.gate_proj", "model.layers.83.mlp.experts.155.gate_proj", "model.layers.83.mlp.experts.156.gate_proj", "model.layers.83.mlp.experts.157.gate_proj", "model.layers.83.mlp.experts.158.gate_proj", "model.layers.83.mlp.experts.159.gate_proj", "model.layers.83.mlp.experts.0.up_proj", "model.layers.83.mlp.experts.1.up_proj", "model.layers.83.mlp.experts.2.up_proj", "model.layers.83.mlp.experts.3.up_proj", "model.layers.83.mlp.experts.4.up_proj", "model.layers.83.mlp.experts.5.up_proj", "model.layers.83.mlp.experts.6.up_proj", "model.layers.83.mlp.experts.7.up_proj", "model.layers.83.mlp.experts.8.up_proj", "model.layers.83.mlp.experts.9.up_proj", "model.layers.83.mlp.experts.10.up_proj", "model.layers.83.mlp.experts.11.up_proj", "model.layers.83.mlp.experts.12.up_proj", "model.layers.83.mlp.experts.13.up_proj", "model.layers.83.mlp.experts.14.up_proj", "model.layers.83.mlp.experts.15.up_proj", "model.layers.83.mlp.experts.16.up_proj", "model.layers.83.mlp.experts.17.up_proj", "model.layers.83.mlp.experts.18.up_proj", "model.layers.83.mlp.experts.19.up_proj", "model.layers.83.mlp.experts.20.up_proj", "model.layers.83.mlp.experts.21.up_proj", "model.layers.83.mlp.experts.22.up_proj", "model.layers.83.mlp.experts.23.up_proj", "model.layers.83.mlp.experts.24.up_proj", "model.layers.83.mlp.experts.25.up_proj", "model.layers.83.mlp.experts.26.up_proj", "model.layers.83.mlp.experts.27.up_proj", "model.layers.83.mlp.experts.28.up_proj", "model.layers.83.mlp.experts.29.up_proj", "model.layers.83.mlp.experts.30.up_proj", "model.layers.83.mlp.experts.31.up_proj", "model.layers.83.mlp.experts.32.up_proj", "model.layers.83.mlp.experts.33.up_proj", "model.layers.83.mlp.experts.34.up_proj", "model.layers.83.mlp.experts.35.up_proj", "model.layers.83.mlp.experts.36.up_proj", "model.layers.83.mlp.experts.37.up_proj", "model.layers.83.mlp.experts.38.up_proj", "model.layers.83.mlp.experts.39.up_proj", "model.layers.83.mlp.experts.40.up_proj", "model.layers.83.mlp.experts.41.up_proj", "model.layers.83.mlp.experts.42.up_proj", "model.layers.83.mlp.experts.43.up_proj", "model.layers.83.mlp.experts.44.up_proj", "model.layers.83.mlp.experts.45.up_proj", "model.layers.83.mlp.experts.46.up_proj", "model.layers.83.mlp.experts.47.up_proj", "model.layers.83.mlp.experts.48.up_proj", "model.layers.83.mlp.experts.49.up_proj", "model.layers.83.mlp.experts.50.up_proj", "model.layers.83.mlp.experts.51.up_proj", "model.layers.83.mlp.experts.52.up_proj", "model.layers.83.mlp.experts.53.up_proj", "model.layers.83.mlp.experts.54.up_proj", "model.layers.83.mlp.experts.55.up_proj", "model.layers.83.mlp.experts.56.up_proj", "model.layers.83.mlp.experts.57.up_proj", "model.layers.83.mlp.experts.58.up_proj", "model.layers.83.mlp.experts.59.up_proj", "model.layers.83.mlp.experts.60.up_proj", "model.layers.83.mlp.experts.61.up_proj", "model.layers.83.mlp.experts.62.up_proj", "model.layers.83.mlp.experts.63.up_proj", "model.layers.83.mlp.experts.64.up_proj", "model.layers.83.mlp.experts.65.up_proj", "model.layers.83.mlp.experts.66.up_proj", "model.layers.83.mlp.experts.67.up_proj", "model.layers.83.mlp.experts.68.up_proj", "model.layers.83.mlp.experts.69.up_proj", "model.layers.83.mlp.experts.70.up_proj", "model.layers.83.mlp.experts.71.up_proj", "model.layers.83.mlp.experts.72.up_proj", "model.layers.83.mlp.experts.73.up_proj", "model.layers.83.mlp.experts.74.up_proj", "model.layers.83.mlp.experts.75.up_proj", "model.layers.83.mlp.experts.76.up_proj", "model.layers.83.mlp.experts.77.up_proj", "model.layers.83.mlp.experts.78.up_proj", "model.layers.83.mlp.experts.79.up_proj", "model.layers.83.mlp.experts.80.up_proj", "model.layers.83.mlp.experts.81.up_proj", "model.layers.83.mlp.experts.82.up_proj", "model.layers.83.mlp.experts.83.up_proj", "model.layers.83.mlp.experts.84.up_proj", "model.layers.83.mlp.experts.85.up_proj", "model.layers.83.mlp.experts.86.up_proj", "model.layers.83.mlp.experts.87.up_proj", "model.layers.83.mlp.experts.88.up_proj", "model.layers.83.mlp.experts.89.up_proj", "model.layers.83.mlp.experts.90.up_proj", "model.layers.83.mlp.experts.91.up_proj", "model.layers.83.mlp.experts.92.up_proj", "model.layers.83.mlp.experts.93.up_proj", "model.layers.83.mlp.experts.94.up_proj", "model.layers.83.mlp.experts.95.up_proj", "model.layers.83.mlp.experts.96.up_proj", "model.layers.83.mlp.experts.97.up_proj", "model.layers.83.mlp.experts.98.up_proj", "model.layers.83.mlp.experts.99.up_proj", "model.layers.83.mlp.experts.100.up_proj", "model.layers.83.mlp.experts.101.up_proj", "model.layers.83.mlp.experts.102.up_proj", "model.layers.83.mlp.experts.103.up_proj", "model.layers.83.mlp.experts.104.up_proj", "model.layers.83.mlp.experts.105.up_proj", "model.layers.83.mlp.experts.106.up_proj", "model.layers.83.mlp.experts.107.up_proj", "model.layers.83.mlp.experts.108.up_proj", "model.layers.83.mlp.experts.109.up_proj", "model.layers.83.mlp.experts.110.up_proj", "model.layers.83.mlp.experts.111.up_proj", "model.layers.83.mlp.experts.112.up_proj", "model.layers.83.mlp.experts.113.up_proj", "model.layers.83.mlp.experts.114.up_proj", "model.layers.83.mlp.experts.115.up_proj", "model.layers.83.mlp.experts.116.up_proj", "model.layers.83.mlp.experts.117.up_proj", "model.layers.83.mlp.experts.118.up_proj", "model.layers.83.mlp.experts.119.up_proj", "model.layers.83.mlp.experts.120.up_proj", "model.layers.83.mlp.experts.121.up_proj", "model.layers.83.mlp.experts.122.up_proj", "model.layers.83.mlp.experts.123.up_proj", "model.layers.83.mlp.experts.124.up_proj", "model.layers.83.mlp.experts.125.up_proj", "model.layers.83.mlp.experts.126.up_proj", "model.layers.83.mlp.experts.127.up_proj", "model.layers.83.mlp.experts.128.up_proj", "model.layers.83.mlp.experts.129.up_proj", "model.layers.83.mlp.experts.130.up_proj", "model.layers.83.mlp.experts.131.up_proj", "model.layers.83.mlp.experts.132.up_proj", "model.layers.83.mlp.experts.133.up_proj", "model.layers.83.mlp.experts.134.up_proj", "model.layers.83.mlp.experts.135.up_proj", "model.layers.83.mlp.experts.136.up_proj", "model.layers.83.mlp.experts.137.up_proj", "model.layers.83.mlp.experts.138.up_proj", "model.layers.83.mlp.experts.139.up_proj", "model.layers.83.mlp.experts.140.up_proj", "model.layers.83.mlp.experts.141.up_proj", "model.layers.83.mlp.experts.142.up_proj", "model.layers.83.mlp.experts.143.up_proj", "model.layers.83.mlp.experts.144.up_proj", "model.layers.83.mlp.experts.145.up_proj", "model.layers.83.mlp.experts.146.up_proj", "model.layers.83.mlp.experts.147.up_proj", "model.layers.83.mlp.experts.148.up_proj", "model.layers.83.mlp.experts.149.up_proj", "model.layers.83.mlp.experts.150.up_proj", "model.layers.83.mlp.experts.151.up_proj", "model.layers.83.mlp.experts.152.up_proj", "model.layers.83.mlp.experts.153.up_proj", "model.layers.83.mlp.experts.154.up_proj", "model.layers.83.mlp.experts.155.up_proj", "model.layers.83.mlp.experts.156.up_proj", "model.layers.83.mlp.experts.157.up_proj", "model.layers.83.mlp.experts.158.up_proj", "model.layers.83.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.6345642507090141e-06, "dbits": 2516582400 }, { "dkld": -1.7637433484195622e-05, "dbits": 5033164800 } ] }, { "idx": 500, "layers": [ "model.layers.83.mlp.experts.0.down_proj", "model.layers.83.mlp.experts.1.down_proj", "model.layers.83.mlp.experts.2.down_proj", "model.layers.83.mlp.experts.3.down_proj", "model.layers.83.mlp.experts.4.down_proj", "model.layers.83.mlp.experts.5.down_proj", "model.layers.83.mlp.experts.6.down_proj", "model.layers.83.mlp.experts.7.down_proj", "model.layers.83.mlp.experts.8.down_proj", "model.layers.83.mlp.experts.9.down_proj", "model.layers.83.mlp.experts.10.down_proj", "model.layers.83.mlp.experts.11.down_proj", "model.layers.83.mlp.experts.12.down_proj", "model.layers.83.mlp.experts.13.down_proj", "model.layers.83.mlp.experts.14.down_proj", "model.layers.83.mlp.experts.15.down_proj", "model.layers.83.mlp.experts.16.down_proj", "model.layers.83.mlp.experts.17.down_proj", "model.layers.83.mlp.experts.18.down_proj", "model.layers.83.mlp.experts.19.down_proj", "model.layers.83.mlp.experts.20.down_proj", "model.layers.83.mlp.experts.21.down_proj", "model.layers.83.mlp.experts.22.down_proj", "model.layers.83.mlp.experts.23.down_proj", "model.layers.83.mlp.experts.24.down_proj", "model.layers.83.mlp.experts.25.down_proj", "model.layers.83.mlp.experts.26.down_proj", "model.layers.83.mlp.experts.27.down_proj", "model.layers.83.mlp.experts.28.down_proj", "model.layers.83.mlp.experts.29.down_proj", "model.layers.83.mlp.experts.30.down_proj", "model.layers.83.mlp.experts.31.down_proj", "model.layers.83.mlp.experts.32.down_proj", "model.layers.83.mlp.experts.33.down_proj", "model.layers.83.mlp.experts.34.down_proj", "model.layers.83.mlp.experts.35.down_proj", "model.layers.83.mlp.experts.36.down_proj", "model.layers.83.mlp.experts.37.down_proj", "model.layers.83.mlp.experts.38.down_proj", "model.layers.83.mlp.experts.39.down_proj", "model.layers.83.mlp.experts.40.down_proj", "model.layers.83.mlp.experts.41.down_proj", "model.layers.83.mlp.experts.42.down_proj", "model.layers.83.mlp.experts.43.down_proj", "model.layers.83.mlp.experts.44.down_proj", "model.layers.83.mlp.experts.45.down_proj", "model.layers.83.mlp.experts.46.down_proj", "model.layers.83.mlp.experts.47.down_proj", "model.layers.83.mlp.experts.48.down_proj", "model.layers.83.mlp.experts.49.down_proj", "model.layers.83.mlp.experts.50.down_proj", "model.layers.83.mlp.experts.51.down_proj", "model.layers.83.mlp.experts.52.down_proj", "model.layers.83.mlp.experts.53.down_proj", "model.layers.83.mlp.experts.54.down_proj", "model.layers.83.mlp.experts.55.down_proj", "model.layers.83.mlp.experts.56.down_proj", "model.layers.83.mlp.experts.57.down_proj", "model.layers.83.mlp.experts.58.down_proj", "model.layers.83.mlp.experts.59.down_proj", "model.layers.83.mlp.experts.60.down_proj", "model.layers.83.mlp.experts.61.down_proj", "model.layers.83.mlp.experts.62.down_proj", "model.layers.83.mlp.experts.63.down_proj", "model.layers.83.mlp.experts.64.down_proj", "model.layers.83.mlp.experts.65.down_proj", "model.layers.83.mlp.experts.66.down_proj", "model.layers.83.mlp.experts.67.down_proj", "model.layers.83.mlp.experts.68.down_proj", "model.layers.83.mlp.experts.69.down_proj", "model.layers.83.mlp.experts.70.down_proj", "model.layers.83.mlp.experts.71.down_proj", "model.layers.83.mlp.experts.72.down_proj", "model.layers.83.mlp.experts.73.down_proj", "model.layers.83.mlp.experts.74.down_proj", "model.layers.83.mlp.experts.75.down_proj", "model.layers.83.mlp.experts.76.down_proj", "model.layers.83.mlp.experts.77.down_proj", "model.layers.83.mlp.experts.78.down_proj", "model.layers.83.mlp.experts.79.down_proj", "model.layers.83.mlp.experts.80.down_proj", "model.layers.83.mlp.experts.81.down_proj", "model.layers.83.mlp.experts.82.down_proj", "model.layers.83.mlp.experts.83.down_proj", "model.layers.83.mlp.experts.84.down_proj", "model.layers.83.mlp.experts.85.down_proj", "model.layers.83.mlp.experts.86.down_proj", "model.layers.83.mlp.experts.87.down_proj", "model.layers.83.mlp.experts.88.down_proj", "model.layers.83.mlp.experts.89.down_proj", "model.layers.83.mlp.experts.90.down_proj", "model.layers.83.mlp.experts.91.down_proj", "model.layers.83.mlp.experts.92.down_proj", "model.layers.83.mlp.experts.93.down_proj", "model.layers.83.mlp.experts.94.down_proj", "model.layers.83.mlp.experts.95.down_proj", "model.layers.83.mlp.experts.96.down_proj", "model.layers.83.mlp.experts.97.down_proj", "model.layers.83.mlp.experts.98.down_proj", "model.layers.83.mlp.experts.99.down_proj", "model.layers.83.mlp.experts.100.down_proj", "model.layers.83.mlp.experts.101.down_proj", "model.layers.83.mlp.experts.102.down_proj", "model.layers.83.mlp.experts.103.down_proj", "model.layers.83.mlp.experts.104.down_proj", "model.layers.83.mlp.experts.105.down_proj", "model.layers.83.mlp.experts.106.down_proj", "model.layers.83.mlp.experts.107.down_proj", "model.layers.83.mlp.experts.108.down_proj", "model.layers.83.mlp.experts.109.down_proj", "model.layers.83.mlp.experts.110.down_proj", "model.layers.83.mlp.experts.111.down_proj", "model.layers.83.mlp.experts.112.down_proj", "model.layers.83.mlp.experts.113.down_proj", "model.layers.83.mlp.experts.114.down_proj", "model.layers.83.mlp.experts.115.down_proj", "model.layers.83.mlp.experts.116.down_proj", "model.layers.83.mlp.experts.117.down_proj", "model.layers.83.mlp.experts.118.down_proj", "model.layers.83.mlp.experts.119.down_proj", "model.layers.83.mlp.experts.120.down_proj", "model.layers.83.mlp.experts.121.down_proj", "model.layers.83.mlp.experts.122.down_proj", "model.layers.83.mlp.experts.123.down_proj", "model.layers.83.mlp.experts.124.down_proj", "model.layers.83.mlp.experts.125.down_proj", "model.layers.83.mlp.experts.126.down_proj", "model.layers.83.mlp.experts.127.down_proj", "model.layers.83.mlp.experts.128.down_proj", "model.layers.83.mlp.experts.129.down_proj", "model.layers.83.mlp.experts.130.down_proj", "model.layers.83.mlp.experts.131.down_proj", "model.layers.83.mlp.experts.132.down_proj", "model.layers.83.mlp.experts.133.down_proj", "model.layers.83.mlp.experts.134.down_proj", "model.layers.83.mlp.experts.135.down_proj", "model.layers.83.mlp.experts.136.down_proj", "model.layers.83.mlp.experts.137.down_proj", "model.layers.83.mlp.experts.138.down_proj", "model.layers.83.mlp.experts.139.down_proj", "model.layers.83.mlp.experts.140.down_proj", "model.layers.83.mlp.experts.141.down_proj", "model.layers.83.mlp.experts.142.down_proj", "model.layers.83.mlp.experts.143.down_proj", "model.layers.83.mlp.experts.144.down_proj", "model.layers.83.mlp.experts.145.down_proj", "model.layers.83.mlp.experts.146.down_proj", "model.layers.83.mlp.experts.147.down_proj", "model.layers.83.mlp.experts.148.down_proj", "model.layers.83.mlp.experts.149.down_proj", "model.layers.83.mlp.experts.150.down_proj", "model.layers.83.mlp.experts.151.down_proj", "model.layers.83.mlp.experts.152.down_proj", "model.layers.83.mlp.experts.153.down_proj", "model.layers.83.mlp.experts.154.down_proj", "model.layers.83.mlp.experts.155.down_proj", "model.layers.83.mlp.experts.156.down_proj", "model.layers.83.mlp.experts.157.down_proj", "model.layers.83.mlp.experts.158.down_proj", "model.layers.83.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -5.662720650433453e-06, "dbits": 1258291200 }, { "dkld": -2.3521482944485056e-06, "dbits": 2516582400 } ] }, { "idx": 501, "layers": [ "model.layers.84.self_attn.q_proj" ], "candidates": [ { "dkld": -7.399173919111351e-05, "dbits": 62914560 }, { "dkld": -0.00010336800478398696, "dbits": 125829120 } ] }, { "idx": 502, "layers": [ "model.layers.84.self_attn.k_proj", "model.layers.84.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00011954999063163926, "dbits": 10485760 }, { "dkld": -8.687709923833539e-05, "dbits": 20971520 } ] }, { "idx": 503, "layers": [ "model.layers.84.self_attn.o_proj" ], "candidates": [ { "dkld": 7.090345025063602e-06, "dbits": 62914560 }, { "dkld": -2.2786902263757097e-06, "dbits": 125829120 } ] }, { "idx": 504, "layers": [ "model.layers.84.mlp.shared_experts.gate_proj", "model.layers.84.mlp.shared_experts.up_proj", "model.layers.84.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 6.615577731281658e-05, "dbits": 23592960 }, { "dkld": 8.837536443024978e-05, "dbits": 47185920 } ] }, { "idx": 505, "layers": [ "model.layers.84.mlp.experts.0.gate_proj", "model.layers.84.mlp.experts.1.gate_proj", "model.layers.84.mlp.experts.2.gate_proj", "model.layers.84.mlp.experts.3.gate_proj", "model.layers.84.mlp.experts.4.gate_proj", "model.layers.84.mlp.experts.5.gate_proj", "model.layers.84.mlp.experts.6.gate_proj", "model.layers.84.mlp.experts.7.gate_proj", "model.layers.84.mlp.experts.8.gate_proj", "model.layers.84.mlp.experts.9.gate_proj", "model.layers.84.mlp.experts.10.gate_proj", "model.layers.84.mlp.experts.11.gate_proj", "model.layers.84.mlp.experts.12.gate_proj", "model.layers.84.mlp.experts.13.gate_proj", "model.layers.84.mlp.experts.14.gate_proj", "model.layers.84.mlp.experts.15.gate_proj", "model.layers.84.mlp.experts.16.gate_proj", "model.layers.84.mlp.experts.17.gate_proj", "model.layers.84.mlp.experts.18.gate_proj", "model.layers.84.mlp.experts.19.gate_proj", "model.layers.84.mlp.experts.20.gate_proj", "model.layers.84.mlp.experts.21.gate_proj", "model.layers.84.mlp.experts.22.gate_proj", "model.layers.84.mlp.experts.23.gate_proj", "model.layers.84.mlp.experts.24.gate_proj", "model.layers.84.mlp.experts.25.gate_proj", "model.layers.84.mlp.experts.26.gate_proj", "model.layers.84.mlp.experts.27.gate_proj", "model.layers.84.mlp.experts.28.gate_proj", "model.layers.84.mlp.experts.29.gate_proj", "model.layers.84.mlp.experts.30.gate_proj", "model.layers.84.mlp.experts.31.gate_proj", "model.layers.84.mlp.experts.32.gate_proj", "model.layers.84.mlp.experts.33.gate_proj", "model.layers.84.mlp.experts.34.gate_proj", "model.layers.84.mlp.experts.35.gate_proj", "model.layers.84.mlp.experts.36.gate_proj", "model.layers.84.mlp.experts.37.gate_proj", "model.layers.84.mlp.experts.38.gate_proj", "model.layers.84.mlp.experts.39.gate_proj", "model.layers.84.mlp.experts.40.gate_proj", "model.layers.84.mlp.experts.41.gate_proj", "model.layers.84.mlp.experts.42.gate_proj", "model.layers.84.mlp.experts.43.gate_proj", "model.layers.84.mlp.experts.44.gate_proj", "model.layers.84.mlp.experts.45.gate_proj", "model.layers.84.mlp.experts.46.gate_proj", "model.layers.84.mlp.experts.47.gate_proj", "model.layers.84.mlp.experts.48.gate_proj", "model.layers.84.mlp.experts.49.gate_proj", "model.layers.84.mlp.experts.50.gate_proj", "model.layers.84.mlp.experts.51.gate_proj", "model.layers.84.mlp.experts.52.gate_proj", "model.layers.84.mlp.experts.53.gate_proj", "model.layers.84.mlp.experts.54.gate_proj", "model.layers.84.mlp.experts.55.gate_proj", "model.layers.84.mlp.experts.56.gate_proj", "model.layers.84.mlp.experts.57.gate_proj", "model.layers.84.mlp.experts.58.gate_proj", "model.layers.84.mlp.experts.59.gate_proj", "model.layers.84.mlp.experts.60.gate_proj", "model.layers.84.mlp.experts.61.gate_proj", "model.layers.84.mlp.experts.62.gate_proj", "model.layers.84.mlp.experts.63.gate_proj", "model.layers.84.mlp.experts.64.gate_proj", "model.layers.84.mlp.experts.65.gate_proj", "model.layers.84.mlp.experts.66.gate_proj", "model.layers.84.mlp.experts.67.gate_proj", "model.layers.84.mlp.experts.68.gate_proj", "model.layers.84.mlp.experts.69.gate_proj", "model.layers.84.mlp.experts.70.gate_proj", "model.layers.84.mlp.experts.71.gate_proj", "model.layers.84.mlp.experts.72.gate_proj", "model.layers.84.mlp.experts.73.gate_proj", "model.layers.84.mlp.experts.74.gate_proj", "model.layers.84.mlp.experts.75.gate_proj", "model.layers.84.mlp.experts.76.gate_proj", "model.layers.84.mlp.experts.77.gate_proj", "model.layers.84.mlp.experts.78.gate_proj", "model.layers.84.mlp.experts.79.gate_proj", "model.layers.84.mlp.experts.80.gate_proj", "model.layers.84.mlp.experts.81.gate_proj", "model.layers.84.mlp.experts.82.gate_proj", "model.layers.84.mlp.experts.83.gate_proj", "model.layers.84.mlp.experts.84.gate_proj", "model.layers.84.mlp.experts.85.gate_proj", "model.layers.84.mlp.experts.86.gate_proj", "model.layers.84.mlp.experts.87.gate_proj", "model.layers.84.mlp.experts.88.gate_proj", "model.layers.84.mlp.experts.89.gate_proj", "model.layers.84.mlp.experts.90.gate_proj", "model.layers.84.mlp.experts.91.gate_proj", "model.layers.84.mlp.experts.92.gate_proj", "model.layers.84.mlp.experts.93.gate_proj", "model.layers.84.mlp.experts.94.gate_proj", "model.layers.84.mlp.experts.95.gate_proj", "model.layers.84.mlp.experts.96.gate_proj", "model.layers.84.mlp.experts.97.gate_proj", "model.layers.84.mlp.experts.98.gate_proj", "model.layers.84.mlp.experts.99.gate_proj", "model.layers.84.mlp.experts.100.gate_proj", "model.layers.84.mlp.experts.101.gate_proj", "model.layers.84.mlp.experts.102.gate_proj", "model.layers.84.mlp.experts.103.gate_proj", "model.layers.84.mlp.experts.104.gate_proj", "model.layers.84.mlp.experts.105.gate_proj", "model.layers.84.mlp.experts.106.gate_proj", "model.layers.84.mlp.experts.107.gate_proj", "model.layers.84.mlp.experts.108.gate_proj", "model.layers.84.mlp.experts.109.gate_proj", "model.layers.84.mlp.experts.110.gate_proj", "model.layers.84.mlp.experts.111.gate_proj", "model.layers.84.mlp.experts.112.gate_proj", "model.layers.84.mlp.experts.113.gate_proj", "model.layers.84.mlp.experts.114.gate_proj", "model.layers.84.mlp.experts.115.gate_proj", "model.layers.84.mlp.experts.116.gate_proj", "model.layers.84.mlp.experts.117.gate_proj", "model.layers.84.mlp.experts.118.gate_proj", "model.layers.84.mlp.experts.119.gate_proj", "model.layers.84.mlp.experts.120.gate_proj", "model.layers.84.mlp.experts.121.gate_proj", "model.layers.84.mlp.experts.122.gate_proj", "model.layers.84.mlp.experts.123.gate_proj", "model.layers.84.mlp.experts.124.gate_proj", "model.layers.84.mlp.experts.125.gate_proj", "model.layers.84.mlp.experts.126.gate_proj", "model.layers.84.mlp.experts.127.gate_proj", "model.layers.84.mlp.experts.128.gate_proj", "model.layers.84.mlp.experts.129.gate_proj", "model.layers.84.mlp.experts.130.gate_proj", "model.layers.84.mlp.experts.131.gate_proj", "model.layers.84.mlp.experts.132.gate_proj", "model.layers.84.mlp.experts.133.gate_proj", "model.layers.84.mlp.experts.134.gate_proj", "model.layers.84.mlp.experts.135.gate_proj", "model.layers.84.mlp.experts.136.gate_proj", "model.layers.84.mlp.experts.137.gate_proj", "model.layers.84.mlp.experts.138.gate_proj", "model.layers.84.mlp.experts.139.gate_proj", "model.layers.84.mlp.experts.140.gate_proj", "model.layers.84.mlp.experts.141.gate_proj", "model.layers.84.mlp.experts.142.gate_proj", "model.layers.84.mlp.experts.143.gate_proj", "model.layers.84.mlp.experts.144.gate_proj", "model.layers.84.mlp.experts.145.gate_proj", "model.layers.84.mlp.experts.146.gate_proj", "model.layers.84.mlp.experts.147.gate_proj", "model.layers.84.mlp.experts.148.gate_proj", "model.layers.84.mlp.experts.149.gate_proj", "model.layers.84.mlp.experts.150.gate_proj", "model.layers.84.mlp.experts.151.gate_proj", "model.layers.84.mlp.experts.152.gate_proj", "model.layers.84.mlp.experts.153.gate_proj", "model.layers.84.mlp.experts.154.gate_proj", "model.layers.84.mlp.experts.155.gate_proj", "model.layers.84.mlp.experts.156.gate_proj", "model.layers.84.mlp.experts.157.gate_proj", "model.layers.84.mlp.experts.158.gate_proj", "model.layers.84.mlp.experts.159.gate_proj", "model.layers.84.mlp.experts.0.up_proj", "model.layers.84.mlp.experts.1.up_proj", "model.layers.84.mlp.experts.2.up_proj", "model.layers.84.mlp.experts.3.up_proj", "model.layers.84.mlp.experts.4.up_proj", "model.layers.84.mlp.experts.5.up_proj", "model.layers.84.mlp.experts.6.up_proj", "model.layers.84.mlp.experts.7.up_proj", "model.layers.84.mlp.experts.8.up_proj", "model.layers.84.mlp.experts.9.up_proj", "model.layers.84.mlp.experts.10.up_proj", "model.layers.84.mlp.experts.11.up_proj", "model.layers.84.mlp.experts.12.up_proj", "model.layers.84.mlp.experts.13.up_proj", "model.layers.84.mlp.experts.14.up_proj", "model.layers.84.mlp.experts.15.up_proj", "model.layers.84.mlp.experts.16.up_proj", "model.layers.84.mlp.experts.17.up_proj", "model.layers.84.mlp.experts.18.up_proj", "model.layers.84.mlp.experts.19.up_proj", "model.layers.84.mlp.experts.20.up_proj", "model.layers.84.mlp.experts.21.up_proj", "model.layers.84.mlp.experts.22.up_proj", "model.layers.84.mlp.experts.23.up_proj", "model.layers.84.mlp.experts.24.up_proj", "model.layers.84.mlp.experts.25.up_proj", "model.layers.84.mlp.experts.26.up_proj", "model.layers.84.mlp.experts.27.up_proj", "model.layers.84.mlp.experts.28.up_proj", "model.layers.84.mlp.experts.29.up_proj", "model.layers.84.mlp.experts.30.up_proj", "model.layers.84.mlp.experts.31.up_proj", "model.layers.84.mlp.experts.32.up_proj", "model.layers.84.mlp.experts.33.up_proj", "model.layers.84.mlp.experts.34.up_proj", "model.layers.84.mlp.experts.35.up_proj", "model.layers.84.mlp.experts.36.up_proj", "model.layers.84.mlp.experts.37.up_proj", "model.layers.84.mlp.experts.38.up_proj", "model.layers.84.mlp.experts.39.up_proj", "model.layers.84.mlp.experts.40.up_proj", "model.layers.84.mlp.experts.41.up_proj", "model.layers.84.mlp.experts.42.up_proj", "model.layers.84.mlp.experts.43.up_proj", "model.layers.84.mlp.experts.44.up_proj", "model.layers.84.mlp.experts.45.up_proj", "model.layers.84.mlp.experts.46.up_proj", "model.layers.84.mlp.experts.47.up_proj", "model.layers.84.mlp.experts.48.up_proj", "model.layers.84.mlp.experts.49.up_proj", "model.layers.84.mlp.experts.50.up_proj", "model.layers.84.mlp.experts.51.up_proj", "model.layers.84.mlp.experts.52.up_proj", "model.layers.84.mlp.experts.53.up_proj", "model.layers.84.mlp.experts.54.up_proj", "model.layers.84.mlp.experts.55.up_proj", "model.layers.84.mlp.experts.56.up_proj", "model.layers.84.mlp.experts.57.up_proj", "model.layers.84.mlp.experts.58.up_proj", "model.layers.84.mlp.experts.59.up_proj", "model.layers.84.mlp.experts.60.up_proj", "model.layers.84.mlp.experts.61.up_proj", "model.layers.84.mlp.experts.62.up_proj", "model.layers.84.mlp.experts.63.up_proj", "model.layers.84.mlp.experts.64.up_proj", "model.layers.84.mlp.experts.65.up_proj", "model.layers.84.mlp.experts.66.up_proj", "model.layers.84.mlp.experts.67.up_proj", "model.layers.84.mlp.experts.68.up_proj", "model.layers.84.mlp.experts.69.up_proj", "model.layers.84.mlp.experts.70.up_proj", "model.layers.84.mlp.experts.71.up_proj", "model.layers.84.mlp.experts.72.up_proj", "model.layers.84.mlp.experts.73.up_proj", "model.layers.84.mlp.experts.74.up_proj", "model.layers.84.mlp.experts.75.up_proj", "model.layers.84.mlp.experts.76.up_proj", "model.layers.84.mlp.experts.77.up_proj", "model.layers.84.mlp.experts.78.up_proj", "model.layers.84.mlp.experts.79.up_proj", "model.layers.84.mlp.experts.80.up_proj", "model.layers.84.mlp.experts.81.up_proj", "model.layers.84.mlp.experts.82.up_proj", "model.layers.84.mlp.experts.83.up_proj", "model.layers.84.mlp.experts.84.up_proj", "model.layers.84.mlp.experts.85.up_proj", "model.layers.84.mlp.experts.86.up_proj", "model.layers.84.mlp.experts.87.up_proj", "model.layers.84.mlp.experts.88.up_proj", "model.layers.84.mlp.experts.89.up_proj", "model.layers.84.mlp.experts.90.up_proj", "model.layers.84.mlp.experts.91.up_proj", "model.layers.84.mlp.experts.92.up_proj", "model.layers.84.mlp.experts.93.up_proj", "model.layers.84.mlp.experts.94.up_proj", "model.layers.84.mlp.experts.95.up_proj", "model.layers.84.mlp.experts.96.up_proj", "model.layers.84.mlp.experts.97.up_proj", "model.layers.84.mlp.experts.98.up_proj", "model.layers.84.mlp.experts.99.up_proj", "model.layers.84.mlp.experts.100.up_proj", "model.layers.84.mlp.experts.101.up_proj", "model.layers.84.mlp.experts.102.up_proj", "model.layers.84.mlp.experts.103.up_proj", "model.layers.84.mlp.experts.104.up_proj", "model.layers.84.mlp.experts.105.up_proj", "model.layers.84.mlp.experts.106.up_proj", "model.layers.84.mlp.experts.107.up_proj", "model.layers.84.mlp.experts.108.up_proj", "model.layers.84.mlp.experts.109.up_proj", "model.layers.84.mlp.experts.110.up_proj", "model.layers.84.mlp.experts.111.up_proj", "model.layers.84.mlp.experts.112.up_proj", "model.layers.84.mlp.experts.113.up_proj", "model.layers.84.mlp.experts.114.up_proj", "model.layers.84.mlp.experts.115.up_proj", "model.layers.84.mlp.experts.116.up_proj", "model.layers.84.mlp.experts.117.up_proj", "model.layers.84.mlp.experts.118.up_proj", "model.layers.84.mlp.experts.119.up_proj", "model.layers.84.mlp.experts.120.up_proj", "model.layers.84.mlp.experts.121.up_proj", "model.layers.84.mlp.experts.122.up_proj", "model.layers.84.mlp.experts.123.up_proj", "model.layers.84.mlp.experts.124.up_proj", "model.layers.84.mlp.experts.125.up_proj", "model.layers.84.mlp.experts.126.up_proj", "model.layers.84.mlp.experts.127.up_proj", "model.layers.84.mlp.experts.128.up_proj", "model.layers.84.mlp.experts.129.up_proj", "model.layers.84.mlp.experts.130.up_proj", "model.layers.84.mlp.experts.131.up_proj", "model.layers.84.mlp.experts.132.up_proj", "model.layers.84.mlp.experts.133.up_proj", "model.layers.84.mlp.experts.134.up_proj", "model.layers.84.mlp.experts.135.up_proj", "model.layers.84.mlp.experts.136.up_proj", "model.layers.84.mlp.experts.137.up_proj", "model.layers.84.mlp.experts.138.up_proj", "model.layers.84.mlp.experts.139.up_proj", "model.layers.84.mlp.experts.140.up_proj", "model.layers.84.mlp.experts.141.up_proj", "model.layers.84.mlp.experts.142.up_proj", "model.layers.84.mlp.experts.143.up_proj", "model.layers.84.mlp.experts.144.up_proj", "model.layers.84.mlp.experts.145.up_proj", "model.layers.84.mlp.experts.146.up_proj", "model.layers.84.mlp.experts.147.up_proj", "model.layers.84.mlp.experts.148.up_proj", "model.layers.84.mlp.experts.149.up_proj", "model.layers.84.mlp.experts.150.up_proj", "model.layers.84.mlp.experts.151.up_proj", "model.layers.84.mlp.experts.152.up_proj", "model.layers.84.mlp.experts.153.up_proj", "model.layers.84.mlp.experts.154.up_proj", "model.layers.84.mlp.experts.155.up_proj", "model.layers.84.mlp.experts.156.up_proj", "model.layers.84.mlp.experts.157.up_proj", "model.layers.84.mlp.experts.158.up_proj", "model.layers.84.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -2.3144017904996178e-05, "dbits": 2516582400 }, { "dkld": -2.8110248968003793e-05, "dbits": 5033164800 } ] }, { "idx": 506, "layers": [ "model.layers.84.mlp.experts.0.down_proj", "model.layers.84.mlp.experts.1.down_proj", "model.layers.84.mlp.experts.2.down_proj", "model.layers.84.mlp.experts.3.down_proj", "model.layers.84.mlp.experts.4.down_proj", "model.layers.84.mlp.experts.5.down_proj", "model.layers.84.mlp.experts.6.down_proj", "model.layers.84.mlp.experts.7.down_proj", "model.layers.84.mlp.experts.8.down_proj", "model.layers.84.mlp.experts.9.down_proj", "model.layers.84.mlp.experts.10.down_proj", "model.layers.84.mlp.experts.11.down_proj", "model.layers.84.mlp.experts.12.down_proj", "model.layers.84.mlp.experts.13.down_proj", "model.layers.84.mlp.experts.14.down_proj", "model.layers.84.mlp.experts.15.down_proj", "model.layers.84.mlp.experts.16.down_proj", "model.layers.84.mlp.experts.17.down_proj", "model.layers.84.mlp.experts.18.down_proj", "model.layers.84.mlp.experts.19.down_proj", "model.layers.84.mlp.experts.20.down_proj", "model.layers.84.mlp.experts.21.down_proj", "model.layers.84.mlp.experts.22.down_proj", "model.layers.84.mlp.experts.23.down_proj", "model.layers.84.mlp.experts.24.down_proj", "model.layers.84.mlp.experts.25.down_proj", "model.layers.84.mlp.experts.26.down_proj", "model.layers.84.mlp.experts.27.down_proj", "model.layers.84.mlp.experts.28.down_proj", "model.layers.84.mlp.experts.29.down_proj", "model.layers.84.mlp.experts.30.down_proj", "model.layers.84.mlp.experts.31.down_proj", "model.layers.84.mlp.experts.32.down_proj", "model.layers.84.mlp.experts.33.down_proj", "model.layers.84.mlp.experts.34.down_proj", "model.layers.84.mlp.experts.35.down_proj", "model.layers.84.mlp.experts.36.down_proj", "model.layers.84.mlp.experts.37.down_proj", "model.layers.84.mlp.experts.38.down_proj", "model.layers.84.mlp.experts.39.down_proj", "model.layers.84.mlp.experts.40.down_proj", "model.layers.84.mlp.experts.41.down_proj", "model.layers.84.mlp.experts.42.down_proj", "model.layers.84.mlp.experts.43.down_proj", "model.layers.84.mlp.experts.44.down_proj", "model.layers.84.mlp.experts.45.down_proj", "model.layers.84.mlp.experts.46.down_proj", "model.layers.84.mlp.experts.47.down_proj", "model.layers.84.mlp.experts.48.down_proj", "model.layers.84.mlp.experts.49.down_proj", "model.layers.84.mlp.experts.50.down_proj", "model.layers.84.mlp.experts.51.down_proj", "model.layers.84.mlp.experts.52.down_proj", "model.layers.84.mlp.experts.53.down_proj", "model.layers.84.mlp.experts.54.down_proj", "model.layers.84.mlp.experts.55.down_proj", "model.layers.84.mlp.experts.56.down_proj", "model.layers.84.mlp.experts.57.down_proj", "model.layers.84.mlp.experts.58.down_proj", "model.layers.84.mlp.experts.59.down_proj", "model.layers.84.mlp.experts.60.down_proj", "model.layers.84.mlp.experts.61.down_proj", "model.layers.84.mlp.experts.62.down_proj", "model.layers.84.mlp.experts.63.down_proj", "model.layers.84.mlp.experts.64.down_proj", "model.layers.84.mlp.experts.65.down_proj", "model.layers.84.mlp.experts.66.down_proj", "model.layers.84.mlp.experts.67.down_proj", "model.layers.84.mlp.experts.68.down_proj", "model.layers.84.mlp.experts.69.down_proj", "model.layers.84.mlp.experts.70.down_proj", "model.layers.84.mlp.experts.71.down_proj", "model.layers.84.mlp.experts.72.down_proj", "model.layers.84.mlp.experts.73.down_proj", "model.layers.84.mlp.experts.74.down_proj", "model.layers.84.mlp.experts.75.down_proj", "model.layers.84.mlp.experts.76.down_proj", "model.layers.84.mlp.experts.77.down_proj", "model.layers.84.mlp.experts.78.down_proj", "model.layers.84.mlp.experts.79.down_proj", "model.layers.84.mlp.experts.80.down_proj", "model.layers.84.mlp.experts.81.down_proj", "model.layers.84.mlp.experts.82.down_proj", "model.layers.84.mlp.experts.83.down_proj", "model.layers.84.mlp.experts.84.down_proj", "model.layers.84.mlp.experts.85.down_proj", "model.layers.84.mlp.experts.86.down_proj", "model.layers.84.mlp.experts.87.down_proj", "model.layers.84.mlp.experts.88.down_proj", "model.layers.84.mlp.experts.89.down_proj", "model.layers.84.mlp.experts.90.down_proj", "model.layers.84.mlp.experts.91.down_proj", "model.layers.84.mlp.experts.92.down_proj", "model.layers.84.mlp.experts.93.down_proj", "model.layers.84.mlp.experts.94.down_proj", "model.layers.84.mlp.experts.95.down_proj", "model.layers.84.mlp.experts.96.down_proj", "model.layers.84.mlp.experts.97.down_proj", "model.layers.84.mlp.experts.98.down_proj", "model.layers.84.mlp.experts.99.down_proj", "model.layers.84.mlp.experts.100.down_proj", "model.layers.84.mlp.experts.101.down_proj", "model.layers.84.mlp.experts.102.down_proj", "model.layers.84.mlp.experts.103.down_proj", "model.layers.84.mlp.experts.104.down_proj", "model.layers.84.mlp.experts.105.down_proj", "model.layers.84.mlp.experts.106.down_proj", "model.layers.84.mlp.experts.107.down_proj", "model.layers.84.mlp.experts.108.down_proj", "model.layers.84.mlp.experts.109.down_proj", "model.layers.84.mlp.experts.110.down_proj", "model.layers.84.mlp.experts.111.down_proj", "model.layers.84.mlp.experts.112.down_proj", "model.layers.84.mlp.experts.113.down_proj", "model.layers.84.mlp.experts.114.down_proj", "model.layers.84.mlp.experts.115.down_proj", "model.layers.84.mlp.experts.116.down_proj", "model.layers.84.mlp.experts.117.down_proj", "model.layers.84.mlp.experts.118.down_proj", "model.layers.84.mlp.experts.119.down_proj", "model.layers.84.mlp.experts.120.down_proj", "model.layers.84.mlp.experts.121.down_proj", "model.layers.84.mlp.experts.122.down_proj", "model.layers.84.mlp.experts.123.down_proj", "model.layers.84.mlp.experts.124.down_proj", "model.layers.84.mlp.experts.125.down_proj", "model.layers.84.mlp.experts.126.down_proj", "model.layers.84.mlp.experts.127.down_proj", "model.layers.84.mlp.experts.128.down_proj", "model.layers.84.mlp.experts.129.down_proj", "model.layers.84.mlp.experts.130.down_proj", "model.layers.84.mlp.experts.131.down_proj", "model.layers.84.mlp.experts.132.down_proj", "model.layers.84.mlp.experts.133.down_proj", "model.layers.84.mlp.experts.134.down_proj", "model.layers.84.mlp.experts.135.down_proj", "model.layers.84.mlp.experts.136.down_proj", "model.layers.84.mlp.experts.137.down_proj", "model.layers.84.mlp.experts.138.down_proj", "model.layers.84.mlp.experts.139.down_proj", "model.layers.84.mlp.experts.140.down_proj", "model.layers.84.mlp.experts.141.down_proj", "model.layers.84.mlp.experts.142.down_proj", "model.layers.84.mlp.experts.143.down_proj", "model.layers.84.mlp.experts.144.down_proj", "model.layers.84.mlp.experts.145.down_proj", "model.layers.84.mlp.experts.146.down_proj", "model.layers.84.mlp.experts.147.down_proj", "model.layers.84.mlp.experts.148.down_proj", "model.layers.84.mlp.experts.149.down_proj", "model.layers.84.mlp.experts.150.down_proj", "model.layers.84.mlp.experts.151.down_proj", "model.layers.84.mlp.experts.152.down_proj", "model.layers.84.mlp.experts.153.down_proj", "model.layers.84.mlp.experts.154.down_proj", "model.layers.84.mlp.experts.155.down_proj", "model.layers.84.mlp.experts.156.down_proj", "model.layers.84.mlp.experts.157.down_proj", "model.layers.84.mlp.experts.158.down_proj", "model.layers.84.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -2.971966750919819e-06, "dbits": 1258291200 }, { "dkld": -6.0968566685908054e-06, "dbits": 2516582400 } ] }, { "idx": 507, "layers": [ "model.layers.85.self_attn.q_proj" ], "candidates": [ { "dkld": -1.6789906658230824e-05, "dbits": 62914560 }, { "dkld": -7.946244440972666e-05, "dbits": 125829120 } ] }, { "idx": 508, "layers": [ "model.layers.85.self_attn.k_proj", "model.layers.85.self_attn.v_proj" ], "candidates": [ { "dkld": -0.0002520794980227937, "dbits": 10485760 }, { "dkld": -0.00027318759821355273, "dbits": 20971520 } ] }, { "idx": 509, "layers": [ "model.layers.85.self_attn.o_proj" ], "candidates": [ { "dkld": -7.134007755666902e-05, "dbits": 62914560 }, { "dkld": -7.316386327147449e-05, "dbits": 125829120 } ] }, { "idx": 510, "layers": [ "model.layers.85.mlp.shared_experts.gate_proj", "model.layers.85.mlp.shared_experts.up_proj", "model.layers.85.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 3.005419857800111e-05, "dbits": 23592960 }, { "dkld": 3.6919745616615166e-05, "dbits": 47185920 } ] }, { "idx": 511, "layers": [ "model.layers.85.mlp.experts.0.gate_proj", "model.layers.85.mlp.experts.1.gate_proj", "model.layers.85.mlp.experts.2.gate_proj", "model.layers.85.mlp.experts.3.gate_proj", "model.layers.85.mlp.experts.4.gate_proj", "model.layers.85.mlp.experts.5.gate_proj", "model.layers.85.mlp.experts.6.gate_proj", "model.layers.85.mlp.experts.7.gate_proj", "model.layers.85.mlp.experts.8.gate_proj", "model.layers.85.mlp.experts.9.gate_proj", "model.layers.85.mlp.experts.10.gate_proj", "model.layers.85.mlp.experts.11.gate_proj", "model.layers.85.mlp.experts.12.gate_proj", "model.layers.85.mlp.experts.13.gate_proj", "model.layers.85.mlp.experts.14.gate_proj", "model.layers.85.mlp.experts.15.gate_proj", "model.layers.85.mlp.experts.16.gate_proj", "model.layers.85.mlp.experts.17.gate_proj", "model.layers.85.mlp.experts.18.gate_proj", "model.layers.85.mlp.experts.19.gate_proj", "model.layers.85.mlp.experts.20.gate_proj", "model.layers.85.mlp.experts.21.gate_proj", "model.layers.85.mlp.experts.22.gate_proj", "model.layers.85.mlp.experts.23.gate_proj", "model.layers.85.mlp.experts.24.gate_proj", "model.layers.85.mlp.experts.25.gate_proj", "model.layers.85.mlp.experts.26.gate_proj", "model.layers.85.mlp.experts.27.gate_proj", "model.layers.85.mlp.experts.28.gate_proj", "model.layers.85.mlp.experts.29.gate_proj", "model.layers.85.mlp.experts.30.gate_proj", "model.layers.85.mlp.experts.31.gate_proj", "model.layers.85.mlp.experts.32.gate_proj", "model.layers.85.mlp.experts.33.gate_proj", "model.layers.85.mlp.experts.34.gate_proj", "model.layers.85.mlp.experts.35.gate_proj", "model.layers.85.mlp.experts.36.gate_proj", "model.layers.85.mlp.experts.37.gate_proj", "model.layers.85.mlp.experts.38.gate_proj", "model.layers.85.mlp.experts.39.gate_proj", "model.layers.85.mlp.experts.40.gate_proj", "model.layers.85.mlp.experts.41.gate_proj", "model.layers.85.mlp.experts.42.gate_proj", "model.layers.85.mlp.experts.43.gate_proj", "model.layers.85.mlp.experts.44.gate_proj", "model.layers.85.mlp.experts.45.gate_proj", "model.layers.85.mlp.experts.46.gate_proj", "model.layers.85.mlp.experts.47.gate_proj", "model.layers.85.mlp.experts.48.gate_proj", "model.layers.85.mlp.experts.49.gate_proj", "model.layers.85.mlp.experts.50.gate_proj", "model.layers.85.mlp.experts.51.gate_proj", "model.layers.85.mlp.experts.52.gate_proj", "model.layers.85.mlp.experts.53.gate_proj", "model.layers.85.mlp.experts.54.gate_proj", "model.layers.85.mlp.experts.55.gate_proj", "model.layers.85.mlp.experts.56.gate_proj", "model.layers.85.mlp.experts.57.gate_proj", "model.layers.85.mlp.experts.58.gate_proj", "model.layers.85.mlp.experts.59.gate_proj", "model.layers.85.mlp.experts.60.gate_proj", "model.layers.85.mlp.experts.61.gate_proj", "model.layers.85.mlp.experts.62.gate_proj", "model.layers.85.mlp.experts.63.gate_proj", "model.layers.85.mlp.experts.64.gate_proj", "model.layers.85.mlp.experts.65.gate_proj", "model.layers.85.mlp.experts.66.gate_proj", "model.layers.85.mlp.experts.67.gate_proj", "model.layers.85.mlp.experts.68.gate_proj", "model.layers.85.mlp.experts.69.gate_proj", "model.layers.85.mlp.experts.70.gate_proj", "model.layers.85.mlp.experts.71.gate_proj", "model.layers.85.mlp.experts.72.gate_proj", "model.layers.85.mlp.experts.73.gate_proj", "model.layers.85.mlp.experts.74.gate_proj", "model.layers.85.mlp.experts.75.gate_proj", "model.layers.85.mlp.experts.76.gate_proj", "model.layers.85.mlp.experts.77.gate_proj", "model.layers.85.mlp.experts.78.gate_proj", "model.layers.85.mlp.experts.79.gate_proj", "model.layers.85.mlp.experts.80.gate_proj", "model.layers.85.mlp.experts.81.gate_proj", "model.layers.85.mlp.experts.82.gate_proj", "model.layers.85.mlp.experts.83.gate_proj", "model.layers.85.mlp.experts.84.gate_proj", "model.layers.85.mlp.experts.85.gate_proj", "model.layers.85.mlp.experts.86.gate_proj", "model.layers.85.mlp.experts.87.gate_proj", "model.layers.85.mlp.experts.88.gate_proj", "model.layers.85.mlp.experts.89.gate_proj", "model.layers.85.mlp.experts.90.gate_proj", "model.layers.85.mlp.experts.91.gate_proj", "model.layers.85.mlp.experts.92.gate_proj", "model.layers.85.mlp.experts.93.gate_proj", "model.layers.85.mlp.experts.94.gate_proj", "model.layers.85.mlp.experts.95.gate_proj", "model.layers.85.mlp.experts.96.gate_proj", "model.layers.85.mlp.experts.97.gate_proj", "model.layers.85.mlp.experts.98.gate_proj", "model.layers.85.mlp.experts.99.gate_proj", "model.layers.85.mlp.experts.100.gate_proj", "model.layers.85.mlp.experts.101.gate_proj", "model.layers.85.mlp.experts.102.gate_proj", "model.layers.85.mlp.experts.103.gate_proj", "model.layers.85.mlp.experts.104.gate_proj", "model.layers.85.mlp.experts.105.gate_proj", "model.layers.85.mlp.experts.106.gate_proj", "model.layers.85.mlp.experts.107.gate_proj", "model.layers.85.mlp.experts.108.gate_proj", "model.layers.85.mlp.experts.109.gate_proj", "model.layers.85.mlp.experts.110.gate_proj", "model.layers.85.mlp.experts.111.gate_proj", "model.layers.85.mlp.experts.112.gate_proj", "model.layers.85.mlp.experts.113.gate_proj", "model.layers.85.mlp.experts.114.gate_proj", "model.layers.85.mlp.experts.115.gate_proj", "model.layers.85.mlp.experts.116.gate_proj", "model.layers.85.mlp.experts.117.gate_proj", "model.layers.85.mlp.experts.118.gate_proj", "model.layers.85.mlp.experts.119.gate_proj", "model.layers.85.mlp.experts.120.gate_proj", "model.layers.85.mlp.experts.121.gate_proj", "model.layers.85.mlp.experts.122.gate_proj", "model.layers.85.mlp.experts.123.gate_proj", "model.layers.85.mlp.experts.124.gate_proj", "model.layers.85.mlp.experts.125.gate_proj", "model.layers.85.mlp.experts.126.gate_proj", "model.layers.85.mlp.experts.127.gate_proj", "model.layers.85.mlp.experts.128.gate_proj", "model.layers.85.mlp.experts.129.gate_proj", "model.layers.85.mlp.experts.130.gate_proj", "model.layers.85.mlp.experts.131.gate_proj", "model.layers.85.mlp.experts.132.gate_proj", "model.layers.85.mlp.experts.133.gate_proj", "model.layers.85.mlp.experts.134.gate_proj", "model.layers.85.mlp.experts.135.gate_proj", "model.layers.85.mlp.experts.136.gate_proj", "model.layers.85.mlp.experts.137.gate_proj", "model.layers.85.mlp.experts.138.gate_proj", "model.layers.85.mlp.experts.139.gate_proj", "model.layers.85.mlp.experts.140.gate_proj", "model.layers.85.mlp.experts.141.gate_proj", "model.layers.85.mlp.experts.142.gate_proj", "model.layers.85.mlp.experts.143.gate_proj", "model.layers.85.mlp.experts.144.gate_proj", "model.layers.85.mlp.experts.145.gate_proj", "model.layers.85.mlp.experts.146.gate_proj", "model.layers.85.mlp.experts.147.gate_proj", "model.layers.85.mlp.experts.148.gate_proj", "model.layers.85.mlp.experts.149.gate_proj", "model.layers.85.mlp.experts.150.gate_proj", "model.layers.85.mlp.experts.151.gate_proj", "model.layers.85.mlp.experts.152.gate_proj", "model.layers.85.mlp.experts.153.gate_proj", "model.layers.85.mlp.experts.154.gate_proj", "model.layers.85.mlp.experts.155.gate_proj", "model.layers.85.mlp.experts.156.gate_proj", "model.layers.85.mlp.experts.157.gate_proj", "model.layers.85.mlp.experts.158.gate_proj", "model.layers.85.mlp.experts.159.gate_proj", "model.layers.85.mlp.experts.0.up_proj", "model.layers.85.mlp.experts.1.up_proj", "model.layers.85.mlp.experts.2.up_proj", "model.layers.85.mlp.experts.3.up_proj", "model.layers.85.mlp.experts.4.up_proj", "model.layers.85.mlp.experts.5.up_proj", "model.layers.85.mlp.experts.6.up_proj", "model.layers.85.mlp.experts.7.up_proj", "model.layers.85.mlp.experts.8.up_proj", "model.layers.85.mlp.experts.9.up_proj", "model.layers.85.mlp.experts.10.up_proj", "model.layers.85.mlp.experts.11.up_proj", "model.layers.85.mlp.experts.12.up_proj", "model.layers.85.mlp.experts.13.up_proj", "model.layers.85.mlp.experts.14.up_proj", "model.layers.85.mlp.experts.15.up_proj", "model.layers.85.mlp.experts.16.up_proj", "model.layers.85.mlp.experts.17.up_proj", "model.layers.85.mlp.experts.18.up_proj", "model.layers.85.mlp.experts.19.up_proj", "model.layers.85.mlp.experts.20.up_proj", "model.layers.85.mlp.experts.21.up_proj", "model.layers.85.mlp.experts.22.up_proj", "model.layers.85.mlp.experts.23.up_proj", "model.layers.85.mlp.experts.24.up_proj", "model.layers.85.mlp.experts.25.up_proj", "model.layers.85.mlp.experts.26.up_proj", "model.layers.85.mlp.experts.27.up_proj", "model.layers.85.mlp.experts.28.up_proj", "model.layers.85.mlp.experts.29.up_proj", "model.layers.85.mlp.experts.30.up_proj", "model.layers.85.mlp.experts.31.up_proj", "model.layers.85.mlp.experts.32.up_proj", "model.layers.85.mlp.experts.33.up_proj", "model.layers.85.mlp.experts.34.up_proj", "model.layers.85.mlp.experts.35.up_proj", "model.layers.85.mlp.experts.36.up_proj", "model.layers.85.mlp.experts.37.up_proj", "model.layers.85.mlp.experts.38.up_proj", "model.layers.85.mlp.experts.39.up_proj", "model.layers.85.mlp.experts.40.up_proj", "model.layers.85.mlp.experts.41.up_proj", "model.layers.85.mlp.experts.42.up_proj", "model.layers.85.mlp.experts.43.up_proj", "model.layers.85.mlp.experts.44.up_proj", "model.layers.85.mlp.experts.45.up_proj", "model.layers.85.mlp.experts.46.up_proj", "model.layers.85.mlp.experts.47.up_proj", "model.layers.85.mlp.experts.48.up_proj", "model.layers.85.mlp.experts.49.up_proj", "model.layers.85.mlp.experts.50.up_proj", "model.layers.85.mlp.experts.51.up_proj", "model.layers.85.mlp.experts.52.up_proj", "model.layers.85.mlp.experts.53.up_proj", "model.layers.85.mlp.experts.54.up_proj", "model.layers.85.mlp.experts.55.up_proj", "model.layers.85.mlp.experts.56.up_proj", "model.layers.85.mlp.experts.57.up_proj", "model.layers.85.mlp.experts.58.up_proj", "model.layers.85.mlp.experts.59.up_proj", "model.layers.85.mlp.experts.60.up_proj", "model.layers.85.mlp.experts.61.up_proj", "model.layers.85.mlp.experts.62.up_proj", "model.layers.85.mlp.experts.63.up_proj", "model.layers.85.mlp.experts.64.up_proj", "model.layers.85.mlp.experts.65.up_proj", "model.layers.85.mlp.experts.66.up_proj", "model.layers.85.mlp.experts.67.up_proj", "model.layers.85.mlp.experts.68.up_proj", "model.layers.85.mlp.experts.69.up_proj", "model.layers.85.mlp.experts.70.up_proj", "model.layers.85.mlp.experts.71.up_proj", "model.layers.85.mlp.experts.72.up_proj", "model.layers.85.mlp.experts.73.up_proj", "model.layers.85.mlp.experts.74.up_proj", "model.layers.85.mlp.experts.75.up_proj", "model.layers.85.mlp.experts.76.up_proj", "model.layers.85.mlp.experts.77.up_proj", "model.layers.85.mlp.experts.78.up_proj", "model.layers.85.mlp.experts.79.up_proj", "model.layers.85.mlp.experts.80.up_proj", "model.layers.85.mlp.experts.81.up_proj", "model.layers.85.mlp.experts.82.up_proj", "model.layers.85.mlp.experts.83.up_proj", "model.layers.85.mlp.experts.84.up_proj", "model.layers.85.mlp.experts.85.up_proj", "model.layers.85.mlp.experts.86.up_proj", "model.layers.85.mlp.experts.87.up_proj", "model.layers.85.mlp.experts.88.up_proj", "model.layers.85.mlp.experts.89.up_proj", "model.layers.85.mlp.experts.90.up_proj", "model.layers.85.mlp.experts.91.up_proj", "model.layers.85.mlp.experts.92.up_proj", "model.layers.85.mlp.experts.93.up_proj", "model.layers.85.mlp.experts.94.up_proj", "model.layers.85.mlp.experts.95.up_proj", "model.layers.85.mlp.experts.96.up_proj", "model.layers.85.mlp.experts.97.up_proj", "model.layers.85.mlp.experts.98.up_proj", "model.layers.85.mlp.experts.99.up_proj", "model.layers.85.mlp.experts.100.up_proj", "model.layers.85.mlp.experts.101.up_proj", "model.layers.85.mlp.experts.102.up_proj", "model.layers.85.mlp.experts.103.up_proj", "model.layers.85.mlp.experts.104.up_proj", "model.layers.85.mlp.experts.105.up_proj", "model.layers.85.mlp.experts.106.up_proj", "model.layers.85.mlp.experts.107.up_proj", "model.layers.85.mlp.experts.108.up_proj", "model.layers.85.mlp.experts.109.up_proj", "model.layers.85.mlp.experts.110.up_proj", "model.layers.85.mlp.experts.111.up_proj", "model.layers.85.mlp.experts.112.up_proj", "model.layers.85.mlp.experts.113.up_proj", "model.layers.85.mlp.experts.114.up_proj", "model.layers.85.mlp.experts.115.up_proj", "model.layers.85.mlp.experts.116.up_proj", "model.layers.85.mlp.experts.117.up_proj", "model.layers.85.mlp.experts.118.up_proj", "model.layers.85.mlp.experts.119.up_proj", "model.layers.85.mlp.experts.120.up_proj", "model.layers.85.mlp.experts.121.up_proj", "model.layers.85.mlp.experts.122.up_proj", "model.layers.85.mlp.experts.123.up_proj", "model.layers.85.mlp.experts.124.up_proj", "model.layers.85.mlp.experts.125.up_proj", "model.layers.85.mlp.experts.126.up_proj", "model.layers.85.mlp.experts.127.up_proj", "model.layers.85.mlp.experts.128.up_proj", "model.layers.85.mlp.experts.129.up_proj", "model.layers.85.mlp.experts.130.up_proj", "model.layers.85.mlp.experts.131.up_proj", "model.layers.85.mlp.experts.132.up_proj", "model.layers.85.mlp.experts.133.up_proj", "model.layers.85.mlp.experts.134.up_proj", "model.layers.85.mlp.experts.135.up_proj", "model.layers.85.mlp.experts.136.up_proj", "model.layers.85.mlp.experts.137.up_proj", "model.layers.85.mlp.experts.138.up_proj", "model.layers.85.mlp.experts.139.up_proj", "model.layers.85.mlp.experts.140.up_proj", "model.layers.85.mlp.experts.141.up_proj", "model.layers.85.mlp.experts.142.up_proj", "model.layers.85.mlp.experts.143.up_proj", "model.layers.85.mlp.experts.144.up_proj", "model.layers.85.mlp.experts.145.up_proj", "model.layers.85.mlp.experts.146.up_proj", "model.layers.85.mlp.experts.147.up_proj", "model.layers.85.mlp.experts.148.up_proj", "model.layers.85.mlp.experts.149.up_proj", "model.layers.85.mlp.experts.150.up_proj", "model.layers.85.mlp.experts.151.up_proj", "model.layers.85.mlp.experts.152.up_proj", "model.layers.85.mlp.experts.153.up_proj", "model.layers.85.mlp.experts.154.up_proj", "model.layers.85.mlp.experts.155.up_proj", "model.layers.85.mlp.experts.156.up_proj", "model.layers.85.mlp.experts.157.up_proj", "model.layers.85.mlp.experts.158.up_proj", "model.layers.85.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 3.9885332807899215e-05, "dbits": 2516582400 }, { "dkld": 1.3671768829227535e-05, "dbits": 5033164800 } ] }, { "idx": 512, "layers": [ "model.layers.85.mlp.experts.0.down_proj", "model.layers.85.mlp.experts.1.down_proj", "model.layers.85.mlp.experts.2.down_proj", "model.layers.85.mlp.experts.3.down_proj", "model.layers.85.mlp.experts.4.down_proj", "model.layers.85.mlp.experts.5.down_proj", "model.layers.85.mlp.experts.6.down_proj", "model.layers.85.mlp.experts.7.down_proj", "model.layers.85.mlp.experts.8.down_proj", "model.layers.85.mlp.experts.9.down_proj", "model.layers.85.mlp.experts.10.down_proj", "model.layers.85.mlp.experts.11.down_proj", "model.layers.85.mlp.experts.12.down_proj", "model.layers.85.mlp.experts.13.down_proj", "model.layers.85.mlp.experts.14.down_proj", "model.layers.85.mlp.experts.15.down_proj", "model.layers.85.mlp.experts.16.down_proj", "model.layers.85.mlp.experts.17.down_proj", "model.layers.85.mlp.experts.18.down_proj", "model.layers.85.mlp.experts.19.down_proj", "model.layers.85.mlp.experts.20.down_proj", "model.layers.85.mlp.experts.21.down_proj", "model.layers.85.mlp.experts.22.down_proj", "model.layers.85.mlp.experts.23.down_proj", "model.layers.85.mlp.experts.24.down_proj", "model.layers.85.mlp.experts.25.down_proj", "model.layers.85.mlp.experts.26.down_proj", "model.layers.85.mlp.experts.27.down_proj", "model.layers.85.mlp.experts.28.down_proj", "model.layers.85.mlp.experts.29.down_proj", "model.layers.85.mlp.experts.30.down_proj", "model.layers.85.mlp.experts.31.down_proj", "model.layers.85.mlp.experts.32.down_proj", "model.layers.85.mlp.experts.33.down_proj", "model.layers.85.mlp.experts.34.down_proj", "model.layers.85.mlp.experts.35.down_proj", "model.layers.85.mlp.experts.36.down_proj", "model.layers.85.mlp.experts.37.down_proj", "model.layers.85.mlp.experts.38.down_proj", "model.layers.85.mlp.experts.39.down_proj", "model.layers.85.mlp.experts.40.down_proj", "model.layers.85.mlp.experts.41.down_proj", "model.layers.85.mlp.experts.42.down_proj", "model.layers.85.mlp.experts.43.down_proj", "model.layers.85.mlp.experts.44.down_proj", "model.layers.85.mlp.experts.45.down_proj", "model.layers.85.mlp.experts.46.down_proj", "model.layers.85.mlp.experts.47.down_proj", "model.layers.85.mlp.experts.48.down_proj", "model.layers.85.mlp.experts.49.down_proj", "model.layers.85.mlp.experts.50.down_proj", "model.layers.85.mlp.experts.51.down_proj", "model.layers.85.mlp.experts.52.down_proj", "model.layers.85.mlp.experts.53.down_proj", "model.layers.85.mlp.experts.54.down_proj", "model.layers.85.mlp.experts.55.down_proj", "model.layers.85.mlp.experts.56.down_proj", "model.layers.85.mlp.experts.57.down_proj", "model.layers.85.mlp.experts.58.down_proj", "model.layers.85.mlp.experts.59.down_proj", "model.layers.85.mlp.experts.60.down_proj", "model.layers.85.mlp.experts.61.down_proj", "model.layers.85.mlp.experts.62.down_proj", "model.layers.85.mlp.experts.63.down_proj", "model.layers.85.mlp.experts.64.down_proj", "model.layers.85.mlp.experts.65.down_proj", "model.layers.85.mlp.experts.66.down_proj", "model.layers.85.mlp.experts.67.down_proj", "model.layers.85.mlp.experts.68.down_proj", "model.layers.85.mlp.experts.69.down_proj", "model.layers.85.mlp.experts.70.down_proj", "model.layers.85.mlp.experts.71.down_proj", "model.layers.85.mlp.experts.72.down_proj", "model.layers.85.mlp.experts.73.down_proj", "model.layers.85.mlp.experts.74.down_proj", "model.layers.85.mlp.experts.75.down_proj", "model.layers.85.mlp.experts.76.down_proj", "model.layers.85.mlp.experts.77.down_proj", "model.layers.85.mlp.experts.78.down_proj", "model.layers.85.mlp.experts.79.down_proj", "model.layers.85.mlp.experts.80.down_proj", "model.layers.85.mlp.experts.81.down_proj", "model.layers.85.mlp.experts.82.down_proj", "model.layers.85.mlp.experts.83.down_proj", "model.layers.85.mlp.experts.84.down_proj", "model.layers.85.mlp.experts.85.down_proj", "model.layers.85.mlp.experts.86.down_proj", "model.layers.85.mlp.experts.87.down_proj", "model.layers.85.mlp.experts.88.down_proj", "model.layers.85.mlp.experts.89.down_proj", "model.layers.85.mlp.experts.90.down_proj", "model.layers.85.mlp.experts.91.down_proj", "model.layers.85.mlp.experts.92.down_proj", "model.layers.85.mlp.experts.93.down_proj", "model.layers.85.mlp.experts.94.down_proj", "model.layers.85.mlp.experts.95.down_proj", "model.layers.85.mlp.experts.96.down_proj", "model.layers.85.mlp.experts.97.down_proj", "model.layers.85.mlp.experts.98.down_proj", "model.layers.85.mlp.experts.99.down_proj", "model.layers.85.mlp.experts.100.down_proj", "model.layers.85.mlp.experts.101.down_proj", "model.layers.85.mlp.experts.102.down_proj", "model.layers.85.mlp.experts.103.down_proj", "model.layers.85.mlp.experts.104.down_proj", "model.layers.85.mlp.experts.105.down_proj", "model.layers.85.mlp.experts.106.down_proj", "model.layers.85.mlp.experts.107.down_proj", "model.layers.85.mlp.experts.108.down_proj", "model.layers.85.mlp.experts.109.down_proj", "model.layers.85.mlp.experts.110.down_proj", "model.layers.85.mlp.experts.111.down_proj", "model.layers.85.mlp.experts.112.down_proj", "model.layers.85.mlp.experts.113.down_proj", "model.layers.85.mlp.experts.114.down_proj", "model.layers.85.mlp.experts.115.down_proj", "model.layers.85.mlp.experts.116.down_proj", "model.layers.85.mlp.experts.117.down_proj", "model.layers.85.mlp.experts.118.down_proj", "model.layers.85.mlp.experts.119.down_proj", "model.layers.85.mlp.experts.120.down_proj", "model.layers.85.mlp.experts.121.down_proj", "model.layers.85.mlp.experts.122.down_proj", "model.layers.85.mlp.experts.123.down_proj", "model.layers.85.mlp.experts.124.down_proj", "model.layers.85.mlp.experts.125.down_proj", "model.layers.85.mlp.experts.126.down_proj", "model.layers.85.mlp.experts.127.down_proj", "model.layers.85.mlp.experts.128.down_proj", "model.layers.85.mlp.experts.129.down_proj", "model.layers.85.mlp.experts.130.down_proj", "model.layers.85.mlp.experts.131.down_proj", "model.layers.85.mlp.experts.132.down_proj", "model.layers.85.mlp.experts.133.down_proj", "model.layers.85.mlp.experts.134.down_proj", "model.layers.85.mlp.experts.135.down_proj", "model.layers.85.mlp.experts.136.down_proj", "model.layers.85.mlp.experts.137.down_proj", "model.layers.85.mlp.experts.138.down_proj", "model.layers.85.mlp.experts.139.down_proj", "model.layers.85.mlp.experts.140.down_proj", "model.layers.85.mlp.experts.141.down_proj", "model.layers.85.mlp.experts.142.down_proj", "model.layers.85.mlp.experts.143.down_proj", "model.layers.85.mlp.experts.144.down_proj", "model.layers.85.mlp.experts.145.down_proj", "model.layers.85.mlp.experts.146.down_proj", "model.layers.85.mlp.experts.147.down_proj", "model.layers.85.mlp.experts.148.down_proj", "model.layers.85.mlp.experts.149.down_proj", "model.layers.85.mlp.experts.150.down_proj", "model.layers.85.mlp.experts.151.down_proj", "model.layers.85.mlp.experts.152.down_proj", "model.layers.85.mlp.experts.153.down_proj", "model.layers.85.mlp.experts.154.down_proj", "model.layers.85.mlp.experts.155.down_proj", "model.layers.85.mlp.experts.156.down_proj", "model.layers.85.mlp.experts.157.down_proj", "model.layers.85.mlp.experts.158.down_proj", "model.layers.85.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 7.169763557614284e-06, "dbits": 1258291200 }, { "dkld": -8.679856546222123e-06, "dbits": 2516582400 } ] }, { "idx": 513, "layers": [ "model.layers.86.self_attn.q_proj" ], "candidates": [ { "dkld": 1.5895580872896803e-06, "dbits": 62914560 }, { "dkld": -3.115776926278929e-05, "dbits": 125829120 } ] }, { "idx": 514, "layers": [ "model.layers.86.self_attn.k_proj", "model.layers.86.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00011442233808338538, "dbits": 10485760 }, { "dkld": -0.00012855259701609507, "dbits": 20971520 } ] }, { "idx": 515, "layers": [ "model.layers.86.self_attn.o_proj" ], "candidates": [ { "dkld": -0.00012592468410730327, "dbits": 62914560 }, { "dkld": -0.00011145258322358027, "dbits": 125829120 } ] }, { "idx": 516, "layers": [ "model.layers.86.mlp.shared_experts.gate_proj", "model.layers.86.mlp.shared_experts.up_proj", "model.layers.86.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": 1.1437269859016636e-05, "dbits": 23592960 }, { "dkld": -1.371721737086773e-05, "dbits": 47185920 } ] }, { "idx": 517, "layers": [ "model.layers.86.mlp.experts.0.gate_proj", "model.layers.86.mlp.experts.1.gate_proj", "model.layers.86.mlp.experts.2.gate_proj", "model.layers.86.mlp.experts.3.gate_proj", "model.layers.86.mlp.experts.4.gate_proj", "model.layers.86.mlp.experts.5.gate_proj", "model.layers.86.mlp.experts.6.gate_proj", "model.layers.86.mlp.experts.7.gate_proj", "model.layers.86.mlp.experts.8.gate_proj", "model.layers.86.mlp.experts.9.gate_proj", "model.layers.86.mlp.experts.10.gate_proj", "model.layers.86.mlp.experts.11.gate_proj", "model.layers.86.mlp.experts.12.gate_proj", "model.layers.86.mlp.experts.13.gate_proj", "model.layers.86.mlp.experts.14.gate_proj", "model.layers.86.mlp.experts.15.gate_proj", "model.layers.86.mlp.experts.16.gate_proj", "model.layers.86.mlp.experts.17.gate_proj", "model.layers.86.mlp.experts.18.gate_proj", "model.layers.86.mlp.experts.19.gate_proj", "model.layers.86.mlp.experts.20.gate_proj", "model.layers.86.mlp.experts.21.gate_proj", "model.layers.86.mlp.experts.22.gate_proj", "model.layers.86.mlp.experts.23.gate_proj", "model.layers.86.mlp.experts.24.gate_proj", "model.layers.86.mlp.experts.25.gate_proj", "model.layers.86.mlp.experts.26.gate_proj", "model.layers.86.mlp.experts.27.gate_proj", "model.layers.86.mlp.experts.28.gate_proj", "model.layers.86.mlp.experts.29.gate_proj", "model.layers.86.mlp.experts.30.gate_proj", "model.layers.86.mlp.experts.31.gate_proj", "model.layers.86.mlp.experts.32.gate_proj", "model.layers.86.mlp.experts.33.gate_proj", "model.layers.86.mlp.experts.34.gate_proj", "model.layers.86.mlp.experts.35.gate_proj", "model.layers.86.mlp.experts.36.gate_proj", "model.layers.86.mlp.experts.37.gate_proj", "model.layers.86.mlp.experts.38.gate_proj", "model.layers.86.mlp.experts.39.gate_proj", "model.layers.86.mlp.experts.40.gate_proj", "model.layers.86.mlp.experts.41.gate_proj", "model.layers.86.mlp.experts.42.gate_proj", "model.layers.86.mlp.experts.43.gate_proj", "model.layers.86.mlp.experts.44.gate_proj", "model.layers.86.mlp.experts.45.gate_proj", "model.layers.86.mlp.experts.46.gate_proj", "model.layers.86.mlp.experts.47.gate_proj", "model.layers.86.mlp.experts.48.gate_proj", "model.layers.86.mlp.experts.49.gate_proj", "model.layers.86.mlp.experts.50.gate_proj", "model.layers.86.mlp.experts.51.gate_proj", "model.layers.86.mlp.experts.52.gate_proj", "model.layers.86.mlp.experts.53.gate_proj", "model.layers.86.mlp.experts.54.gate_proj", "model.layers.86.mlp.experts.55.gate_proj", "model.layers.86.mlp.experts.56.gate_proj", "model.layers.86.mlp.experts.57.gate_proj", "model.layers.86.mlp.experts.58.gate_proj", "model.layers.86.mlp.experts.59.gate_proj", "model.layers.86.mlp.experts.60.gate_proj", "model.layers.86.mlp.experts.61.gate_proj", "model.layers.86.mlp.experts.62.gate_proj", "model.layers.86.mlp.experts.63.gate_proj", "model.layers.86.mlp.experts.64.gate_proj", "model.layers.86.mlp.experts.65.gate_proj", "model.layers.86.mlp.experts.66.gate_proj", "model.layers.86.mlp.experts.67.gate_proj", "model.layers.86.mlp.experts.68.gate_proj", "model.layers.86.mlp.experts.69.gate_proj", "model.layers.86.mlp.experts.70.gate_proj", "model.layers.86.mlp.experts.71.gate_proj", "model.layers.86.mlp.experts.72.gate_proj", "model.layers.86.mlp.experts.73.gate_proj", "model.layers.86.mlp.experts.74.gate_proj", "model.layers.86.mlp.experts.75.gate_proj", "model.layers.86.mlp.experts.76.gate_proj", "model.layers.86.mlp.experts.77.gate_proj", "model.layers.86.mlp.experts.78.gate_proj", "model.layers.86.mlp.experts.79.gate_proj", "model.layers.86.mlp.experts.80.gate_proj", "model.layers.86.mlp.experts.81.gate_proj", "model.layers.86.mlp.experts.82.gate_proj", "model.layers.86.mlp.experts.83.gate_proj", "model.layers.86.mlp.experts.84.gate_proj", "model.layers.86.mlp.experts.85.gate_proj", "model.layers.86.mlp.experts.86.gate_proj", "model.layers.86.mlp.experts.87.gate_proj", "model.layers.86.mlp.experts.88.gate_proj", "model.layers.86.mlp.experts.89.gate_proj", "model.layers.86.mlp.experts.90.gate_proj", "model.layers.86.mlp.experts.91.gate_proj", "model.layers.86.mlp.experts.92.gate_proj", "model.layers.86.mlp.experts.93.gate_proj", "model.layers.86.mlp.experts.94.gate_proj", "model.layers.86.mlp.experts.95.gate_proj", "model.layers.86.mlp.experts.96.gate_proj", "model.layers.86.mlp.experts.97.gate_proj", "model.layers.86.mlp.experts.98.gate_proj", "model.layers.86.mlp.experts.99.gate_proj", "model.layers.86.mlp.experts.100.gate_proj", "model.layers.86.mlp.experts.101.gate_proj", "model.layers.86.mlp.experts.102.gate_proj", "model.layers.86.mlp.experts.103.gate_proj", "model.layers.86.mlp.experts.104.gate_proj", "model.layers.86.mlp.experts.105.gate_proj", "model.layers.86.mlp.experts.106.gate_proj", "model.layers.86.mlp.experts.107.gate_proj", "model.layers.86.mlp.experts.108.gate_proj", "model.layers.86.mlp.experts.109.gate_proj", "model.layers.86.mlp.experts.110.gate_proj", "model.layers.86.mlp.experts.111.gate_proj", "model.layers.86.mlp.experts.112.gate_proj", "model.layers.86.mlp.experts.113.gate_proj", "model.layers.86.mlp.experts.114.gate_proj", "model.layers.86.mlp.experts.115.gate_proj", "model.layers.86.mlp.experts.116.gate_proj", "model.layers.86.mlp.experts.117.gate_proj", "model.layers.86.mlp.experts.118.gate_proj", "model.layers.86.mlp.experts.119.gate_proj", "model.layers.86.mlp.experts.120.gate_proj", "model.layers.86.mlp.experts.121.gate_proj", "model.layers.86.mlp.experts.122.gate_proj", "model.layers.86.mlp.experts.123.gate_proj", "model.layers.86.mlp.experts.124.gate_proj", "model.layers.86.mlp.experts.125.gate_proj", "model.layers.86.mlp.experts.126.gate_proj", "model.layers.86.mlp.experts.127.gate_proj", "model.layers.86.mlp.experts.128.gate_proj", "model.layers.86.mlp.experts.129.gate_proj", "model.layers.86.mlp.experts.130.gate_proj", "model.layers.86.mlp.experts.131.gate_proj", "model.layers.86.mlp.experts.132.gate_proj", "model.layers.86.mlp.experts.133.gate_proj", "model.layers.86.mlp.experts.134.gate_proj", "model.layers.86.mlp.experts.135.gate_proj", "model.layers.86.mlp.experts.136.gate_proj", "model.layers.86.mlp.experts.137.gate_proj", "model.layers.86.mlp.experts.138.gate_proj", "model.layers.86.mlp.experts.139.gate_proj", "model.layers.86.mlp.experts.140.gate_proj", "model.layers.86.mlp.experts.141.gate_proj", "model.layers.86.mlp.experts.142.gate_proj", "model.layers.86.mlp.experts.143.gate_proj", "model.layers.86.mlp.experts.144.gate_proj", "model.layers.86.mlp.experts.145.gate_proj", "model.layers.86.mlp.experts.146.gate_proj", "model.layers.86.mlp.experts.147.gate_proj", "model.layers.86.mlp.experts.148.gate_proj", "model.layers.86.mlp.experts.149.gate_proj", "model.layers.86.mlp.experts.150.gate_proj", "model.layers.86.mlp.experts.151.gate_proj", "model.layers.86.mlp.experts.152.gate_proj", "model.layers.86.mlp.experts.153.gate_proj", "model.layers.86.mlp.experts.154.gate_proj", "model.layers.86.mlp.experts.155.gate_proj", "model.layers.86.mlp.experts.156.gate_proj", "model.layers.86.mlp.experts.157.gate_proj", "model.layers.86.mlp.experts.158.gate_proj", "model.layers.86.mlp.experts.159.gate_proj", "model.layers.86.mlp.experts.0.up_proj", "model.layers.86.mlp.experts.1.up_proj", "model.layers.86.mlp.experts.2.up_proj", "model.layers.86.mlp.experts.3.up_proj", "model.layers.86.mlp.experts.4.up_proj", "model.layers.86.mlp.experts.5.up_proj", "model.layers.86.mlp.experts.6.up_proj", "model.layers.86.mlp.experts.7.up_proj", "model.layers.86.mlp.experts.8.up_proj", "model.layers.86.mlp.experts.9.up_proj", "model.layers.86.mlp.experts.10.up_proj", "model.layers.86.mlp.experts.11.up_proj", "model.layers.86.mlp.experts.12.up_proj", "model.layers.86.mlp.experts.13.up_proj", "model.layers.86.mlp.experts.14.up_proj", "model.layers.86.mlp.experts.15.up_proj", "model.layers.86.mlp.experts.16.up_proj", "model.layers.86.mlp.experts.17.up_proj", "model.layers.86.mlp.experts.18.up_proj", "model.layers.86.mlp.experts.19.up_proj", "model.layers.86.mlp.experts.20.up_proj", "model.layers.86.mlp.experts.21.up_proj", "model.layers.86.mlp.experts.22.up_proj", "model.layers.86.mlp.experts.23.up_proj", "model.layers.86.mlp.experts.24.up_proj", "model.layers.86.mlp.experts.25.up_proj", "model.layers.86.mlp.experts.26.up_proj", "model.layers.86.mlp.experts.27.up_proj", "model.layers.86.mlp.experts.28.up_proj", "model.layers.86.mlp.experts.29.up_proj", "model.layers.86.mlp.experts.30.up_proj", "model.layers.86.mlp.experts.31.up_proj", "model.layers.86.mlp.experts.32.up_proj", "model.layers.86.mlp.experts.33.up_proj", "model.layers.86.mlp.experts.34.up_proj", "model.layers.86.mlp.experts.35.up_proj", "model.layers.86.mlp.experts.36.up_proj", "model.layers.86.mlp.experts.37.up_proj", "model.layers.86.mlp.experts.38.up_proj", "model.layers.86.mlp.experts.39.up_proj", "model.layers.86.mlp.experts.40.up_proj", "model.layers.86.mlp.experts.41.up_proj", "model.layers.86.mlp.experts.42.up_proj", "model.layers.86.mlp.experts.43.up_proj", "model.layers.86.mlp.experts.44.up_proj", "model.layers.86.mlp.experts.45.up_proj", "model.layers.86.mlp.experts.46.up_proj", "model.layers.86.mlp.experts.47.up_proj", "model.layers.86.mlp.experts.48.up_proj", "model.layers.86.mlp.experts.49.up_proj", "model.layers.86.mlp.experts.50.up_proj", "model.layers.86.mlp.experts.51.up_proj", "model.layers.86.mlp.experts.52.up_proj", "model.layers.86.mlp.experts.53.up_proj", "model.layers.86.mlp.experts.54.up_proj", "model.layers.86.mlp.experts.55.up_proj", "model.layers.86.mlp.experts.56.up_proj", "model.layers.86.mlp.experts.57.up_proj", "model.layers.86.mlp.experts.58.up_proj", "model.layers.86.mlp.experts.59.up_proj", "model.layers.86.mlp.experts.60.up_proj", "model.layers.86.mlp.experts.61.up_proj", "model.layers.86.mlp.experts.62.up_proj", "model.layers.86.mlp.experts.63.up_proj", "model.layers.86.mlp.experts.64.up_proj", "model.layers.86.mlp.experts.65.up_proj", "model.layers.86.mlp.experts.66.up_proj", "model.layers.86.mlp.experts.67.up_proj", "model.layers.86.mlp.experts.68.up_proj", "model.layers.86.mlp.experts.69.up_proj", "model.layers.86.mlp.experts.70.up_proj", "model.layers.86.mlp.experts.71.up_proj", "model.layers.86.mlp.experts.72.up_proj", "model.layers.86.mlp.experts.73.up_proj", "model.layers.86.mlp.experts.74.up_proj", "model.layers.86.mlp.experts.75.up_proj", "model.layers.86.mlp.experts.76.up_proj", "model.layers.86.mlp.experts.77.up_proj", "model.layers.86.mlp.experts.78.up_proj", "model.layers.86.mlp.experts.79.up_proj", "model.layers.86.mlp.experts.80.up_proj", "model.layers.86.mlp.experts.81.up_proj", "model.layers.86.mlp.experts.82.up_proj", "model.layers.86.mlp.experts.83.up_proj", "model.layers.86.mlp.experts.84.up_proj", "model.layers.86.mlp.experts.85.up_proj", "model.layers.86.mlp.experts.86.up_proj", "model.layers.86.mlp.experts.87.up_proj", "model.layers.86.mlp.experts.88.up_proj", "model.layers.86.mlp.experts.89.up_proj", "model.layers.86.mlp.experts.90.up_proj", "model.layers.86.mlp.experts.91.up_proj", "model.layers.86.mlp.experts.92.up_proj", "model.layers.86.mlp.experts.93.up_proj", "model.layers.86.mlp.experts.94.up_proj", "model.layers.86.mlp.experts.95.up_proj", "model.layers.86.mlp.experts.96.up_proj", "model.layers.86.mlp.experts.97.up_proj", "model.layers.86.mlp.experts.98.up_proj", "model.layers.86.mlp.experts.99.up_proj", "model.layers.86.mlp.experts.100.up_proj", "model.layers.86.mlp.experts.101.up_proj", "model.layers.86.mlp.experts.102.up_proj", "model.layers.86.mlp.experts.103.up_proj", "model.layers.86.mlp.experts.104.up_proj", "model.layers.86.mlp.experts.105.up_proj", "model.layers.86.mlp.experts.106.up_proj", "model.layers.86.mlp.experts.107.up_proj", "model.layers.86.mlp.experts.108.up_proj", "model.layers.86.mlp.experts.109.up_proj", "model.layers.86.mlp.experts.110.up_proj", "model.layers.86.mlp.experts.111.up_proj", "model.layers.86.mlp.experts.112.up_proj", "model.layers.86.mlp.experts.113.up_proj", "model.layers.86.mlp.experts.114.up_proj", "model.layers.86.mlp.experts.115.up_proj", "model.layers.86.mlp.experts.116.up_proj", "model.layers.86.mlp.experts.117.up_proj", "model.layers.86.mlp.experts.118.up_proj", "model.layers.86.mlp.experts.119.up_proj", "model.layers.86.mlp.experts.120.up_proj", "model.layers.86.mlp.experts.121.up_proj", "model.layers.86.mlp.experts.122.up_proj", "model.layers.86.mlp.experts.123.up_proj", "model.layers.86.mlp.experts.124.up_proj", "model.layers.86.mlp.experts.125.up_proj", "model.layers.86.mlp.experts.126.up_proj", "model.layers.86.mlp.experts.127.up_proj", "model.layers.86.mlp.experts.128.up_proj", "model.layers.86.mlp.experts.129.up_proj", "model.layers.86.mlp.experts.130.up_proj", "model.layers.86.mlp.experts.131.up_proj", "model.layers.86.mlp.experts.132.up_proj", "model.layers.86.mlp.experts.133.up_proj", "model.layers.86.mlp.experts.134.up_proj", "model.layers.86.mlp.experts.135.up_proj", "model.layers.86.mlp.experts.136.up_proj", "model.layers.86.mlp.experts.137.up_proj", "model.layers.86.mlp.experts.138.up_proj", "model.layers.86.mlp.experts.139.up_proj", "model.layers.86.mlp.experts.140.up_proj", "model.layers.86.mlp.experts.141.up_proj", "model.layers.86.mlp.experts.142.up_proj", "model.layers.86.mlp.experts.143.up_proj", "model.layers.86.mlp.experts.144.up_proj", "model.layers.86.mlp.experts.145.up_proj", "model.layers.86.mlp.experts.146.up_proj", "model.layers.86.mlp.experts.147.up_proj", "model.layers.86.mlp.experts.148.up_proj", "model.layers.86.mlp.experts.149.up_proj", "model.layers.86.mlp.experts.150.up_proj", "model.layers.86.mlp.experts.151.up_proj", "model.layers.86.mlp.experts.152.up_proj", "model.layers.86.mlp.experts.153.up_proj", "model.layers.86.mlp.experts.154.up_proj", "model.layers.86.mlp.experts.155.up_proj", "model.layers.86.mlp.experts.156.up_proj", "model.layers.86.mlp.experts.157.up_proj", "model.layers.86.mlp.experts.158.up_proj", "model.layers.86.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.3947476185857556e-05, "dbits": 2516582400 }, { "dkld": -3.611054271459441e-05, "dbits": 5033164800 } ] }, { "idx": 518, "layers": [ "model.layers.86.mlp.experts.0.down_proj", "model.layers.86.mlp.experts.1.down_proj", "model.layers.86.mlp.experts.2.down_proj", "model.layers.86.mlp.experts.3.down_proj", "model.layers.86.mlp.experts.4.down_proj", "model.layers.86.mlp.experts.5.down_proj", "model.layers.86.mlp.experts.6.down_proj", "model.layers.86.mlp.experts.7.down_proj", "model.layers.86.mlp.experts.8.down_proj", "model.layers.86.mlp.experts.9.down_proj", "model.layers.86.mlp.experts.10.down_proj", "model.layers.86.mlp.experts.11.down_proj", "model.layers.86.mlp.experts.12.down_proj", "model.layers.86.mlp.experts.13.down_proj", "model.layers.86.mlp.experts.14.down_proj", "model.layers.86.mlp.experts.15.down_proj", "model.layers.86.mlp.experts.16.down_proj", "model.layers.86.mlp.experts.17.down_proj", "model.layers.86.mlp.experts.18.down_proj", "model.layers.86.mlp.experts.19.down_proj", "model.layers.86.mlp.experts.20.down_proj", "model.layers.86.mlp.experts.21.down_proj", "model.layers.86.mlp.experts.22.down_proj", "model.layers.86.mlp.experts.23.down_proj", "model.layers.86.mlp.experts.24.down_proj", "model.layers.86.mlp.experts.25.down_proj", "model.layers.86.mlp.experts.26.down_proj", "model.layers.86.mlp.experts.27.down_proj", "model.layers.86.mlp.experts.28.down_proj", "model.layers.86.mlp.experts.29.down_proj", "model.layers.86.mlp.experts.30.down_proj", "model.layers.86.mlp.experts.31.down_proj", "model.layers.86.mlp.experts.32.down_proj", "model.layers.86.mlp.experts.33.down_proj", "model.layers.86.mlp.experts.34.down_proj", "model.layers.86.mlp.experts.35.down_proj", "model.layers.86.mlp.experts.36.down_proj", "model.layers.86.mlp.experts.37.down_proj", "model.layers.86.mlp.experts.38.down_proj", "model.layers.86.mlp.experts.39.down_proj", "model.layers.86.mlp.experts.40.down_proj", "model.layers.86.mlp.experts.41.down_proj", "model.layers.86.mlp.experts.42.down_proj", "model.layers.86.mlp.experts.43.down_proj", "model.layers.86.mlp.experts.44.down_proj", "model.layers.86.mlp.experts.45.down_proj", "model.layers.86.mlp.experts.46.down_proj", "model.layers.86.mlp.experts.47.down_proj", "model.layers.86.mlp.experts.48.down_proj", "model.layers.86.mlp.experts.49.down_proj", "model.layers.86.mlp.experts.50.down_proj", "model.layers.86.mlp.experts.51.down_proj", "model.layers.86.mlp.experts.52.down_proj", "model.layers.86.mlp.experts.53.down_proj", "model.layers.86.mlp.experts.54.down_proj", "model.layers.86.mlp.experts.55.down_proj", "model.layers.86.mlp.experts.56.down_proj", "model.layers.86.mlp.experts.57.down_proj", "model.layers.86.mlp.experts.58.down_proj", "model.layers.86.mlp.experts.59.down_proj", "model.layers.86.mlp.experts.60.down_proj", "model.layers.86.mlp.experts.61.down_proj", "model.layers.86.mlp.experts.62.down_proj", "model.layers.86.mlp.experts.63.down_proj", "model.layers.86.mlp.experts.64.down_proj", "model.layers.86.mlp.experts.65.down_proj", "model.layers.86.mlp.experts.66.down_proj", "model.layers.86.mlp.experts.67.down_proj", "model.layers.86.mlp.experts.68.down_proj", "model.layers.86.mlp.experts.69.down_proj", "model.layers.86.mlp.experts.70.down_proj", "model.layers.86.mlp.experts.71.down_proj", "model.layers.86.mlp.experts.72.down_proj", "model.layers.86.mlp.experts.73.down_proj", "model.layers.86.mlp.experts.74.down_proj", "model.layers.86.mlp.experts.75.down_proj", "model.layers.86.mlp.experts.76.down_proj", "model.layers.86.mlp.experts.77.down_proj", "model.layers.86.mlp.experts.78.down_proj", "model.layers.86.mlp.experts.79.down_proj", "model.layers.86.mlp.experts.80.down_proj", "model.layers.86.mlp.experts.81.down_proj", "model.layers.86.mlp.experts.82.down_proj", "model.layers.86.mlp.experts.83.down_proj", "model.layers.86.mlp.experts.84.down_proj", "model.layers.86.mlp.experts.85.down_proj", "model.layers.86.mlp.experts.86.down_proj", "model.layers.86.mlp.experts.87.down_proj", "model.layers.86.mlp.experts.88.down_proj", "model.layers.86.mlp.experts.89.down_proj", "model.layers.86.mlp.experts.90.down_proj", "model.layers.86.mlp.experts.91.down_proj", "model.layers.86.mlp.experts.92.down_proj", "model.layers.86.mlp.experts.93.down_proj", "model.layers.86.mlp.experts.94.down_proj", "model.layers.86.mlp.experts.95.down_proj", "model.layers.86.mlp.experts.96.down_proj", "model.layers.86.mlp.experts.97.down_proj", "model.layers.86.mlp.experts.98.down_proj", "model.layers.86.mlp.experts.99.down_proj", "model.layers.86.mlp.experts.100.down_proj", "model.layers.86.mlp.experts.101.down_proj", "model.layers.86.mlp.experts.102.down_proj", "model.layers.86.mlp.experts.103.down_proj", "model.layers.86.mlp.experts.104.down_proj", "model.layers.86.mlp.experts.105.down_proj", "model.layers.86.mlp.experts.106.down_proj", "model.layers.86.mlp.experts.107.down_proj", "model.layers.86.mlp.experts.108.down_proj", "model.layers.86.mlp.experts.109.down_proj", "model.layers.86.mlp.experts.110.down_proj", "model.layers.86.mlp.experts.111.down_proj", "model.layers.86.mlp.experts.112.down_proj", "model.layers.86.mlp.experts.113.down_proj", "model.layers.86.mlp.experts.114.down_proj", "model.layers.86.mlp.experts.115.down_proj", "model.layers.86.mlp.experts.116.down_proj", "model.layers.86.mlp.experts.117.down_proj", "model.layers.86.mlp.experts.118.down_proj", "model.layers.86.mlp.experts.119.down_proj", "model.layers.86.mlp.experts.120.down_proj", "model.layers.86.mlp.experts.121.down_proj", "model.layers.86.mlp.experts.122.down_proj", "model.layers.86.mlp.experts.123.down_proj", "model.layers.86.mlp.experts.124.down_proj", "model.layers.86.mlp.experts.125.down_proj", "model.layers.86.mlp.experts.126.down_proj", "model.layers.86.mlp.experts.127.down_proj", "model.layers.86.mlp.experts.128.down_proj", "model.layers.86.mlp.experts.129.down_proj", "model.layers.86.mlp.experts.130.down_proj", "model.layers.86.mlp.experts.131.down_proj", "model.layers.86.mlp.experts.132.down_proj", "model.layers.86.mlp.experts.133.down_proj", "model.layers.86.mlp.experts.134.down_proj", "model.layers.86.mlp.experts.135.down_proj", "model.layers.86.mlp.experts.136.down_proj", "model.layers.86.mlp.experts.137.down_proj", "model.layers.86.mlp.experts.138.down_proj", "model.layers.86.mlp.experts.139.down_proj", "model.layers.86.mlp.experts.140.down_proj", "model.layers.86.mlp.experts.141.down_proj", "model.layers.86.mlp.experts.142.down_proj", "model.layers.86.mlp.experts.143.down_proj", "model.layers.86.mlp.experts.144.down_proj", "model.layers.86.mlp.experts.145.down_proj", "model.layers.86.mlp.experts.146.down_proj", "model.layers.86.mlp.experts.147.down_proj", "model.layers.86.mlp.experts.148.down_proj", "model.layers.86.mlp.experts.149.down_proj", "model.layers.86.mlp.experts.150.down_proj", "model.layers.86.mlp.experts.151.down_proj", "model.layers.86.mlp.experts.152.down_proj", "model.layers.86.mlp.experts.153.down_proj", "model.layers.86.mlp.experts.154.down_proj", "model.layers.86.mlp.experts.155.down_proj", "model.layers.86.mlp.experts.156.down_proj", "model.layers.86.mlp.experts.157.down_proj", "model.layers.86.mlp.experts.158.down_proj", "model.layers.86.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -8.82351305335656e-06, "dbits": 1258291200 }, { "dkld": -4.969025030731461e-06, "dbits": 2516582400 } ] }, { "idx": 519, "layers": [ "model.layers.87.self_attn.q_proj" ], "candidates": [ { "dkld": 9.768456220627525e-06, "dbits": 62914560 }, { "dkld": 1.0641291737570335e-06, "dbits": 125829120 } ] }, { "idx": 520, "layers": [ "model.layers.87.self_attn.k_proj", "model.layers.87.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00013446349184960057, "dbits": 10485760 }, { "dkld": -0.000351743190549314, "dbits": 20971520 } ] }, { "idx": 521, "layers": [ "model.layers.87.self_attn.o_proj" ], "candidates": [ { "dkld": 2.246280200780132e-06, "dbits": 62914560 }, { "dkld": 3.4303870052113106e-06, "dbits": 125829120 } ] }, { "idx": 522, "layers": [ "model.layers.87.mlp.shared_experts.gate_proj", "model.layers.87.mlp.shared_experts.up_proj", "model.layers.87.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.4048069715499878e-05, "dbits": 23592960 }, { "dkld": -5.0191488116978905e-05, "dbits": 47185920 } ] }, { "idx": 523, "layers": [ "model.layers.87.mlp.experts.0.gate_proj", "model.layers.87.mlp.experts.1.gate_proj", "model.layers.87.mlp.experts.2.gate_proj", "model.layers.87.mlp.experts.3.gate_proj", "model.layers.87.mlp.experts.4.gate_proj", "model.layers.87.mlp.experts.5.gate_proj", "model.layers.87.mlp.experts.6.gate_proj", "model.layers.87.mlp.experts.7.gate_proj", "model.layers.87.mlp.experts.8.gate_proj", "model.layers.87.mlp.experts.9.gate_proj", "model.layers.87.mlp.experts.10.gate_proj", "model.layers.87.mlp.experts.11.gate_proj", "model.layers.87.mlp.experts.12.gate_proj", "model.layers.87.mlp.experts.13.gate_proj", "model.layers.87.mlp.experts.14.gate_proj", "model.layers.87.mlp.experts.15.gate_proj", "model.layers.87.mlp.experts.16.gate_proj", "model.layers.87.mlp.experts.17.gate_proj", "model.layers.87.mlp.experts.18.gate_proj", "model.layers.87.mlp.experts.19.gate_proj", "model.layers.87.mlp.experts.20.gate_proj", "model.layers.87.mlp.experts.21.gate_proj", "model.layers.87.mlp.experts.22.gate_proj", "model.layers.87.mlp.experts.23.gate_proj", "model.layers.87.mlp.experts.24.gate_proj", "model.layers.87.mlp.experts.25.gate_proj", "model.layers.87.mlp.experts.26.gate_proj", "model.layers.87.mlp.experts.27.gate_proj", "model.layers.87.mlp.experts.28.gate_proj", "model.layers.87.mlp.experts.29.gate_proj", "model.layers.87.mlp.experts.30.gate_proj", "model.layers.87.mlp.experts.31.gate_proj", "model.layers.87.mlp.experts.32.gate_proj", "model.layers.87.mlp.experts.33.gate_proj", "model.layers.87.mlp.experts.34.gate_proj", "model.layers.87.mlp.experts.35.gate_proj", "model.layers.87.mlp.experts.36.gate_proj", "model.layers.87.mlp.experts.37.gate_proj", "model.layers.87.mlp.experts.38.gate_proj", "model.layers.87.mlp.experts.39.gate_proj", "model.layers.87.mlp.experts.40.gate_proj", "model.layers.87.mlp.experts.41.gate_proj", "model.layers.87.mlp.experts.42.gate_proj", "model.layers.87.mlp.experts.43.gate_proj", "model.layers.87.mlp.experts.44.gate_proj", "model.layers.87.mlp.experts.45.gate_proj", "model.layers.87.mlp.experts.46.gate_proj", "model.layers.87.mlp.experts.47.gate_proj", "model.layers.87.mlp.experts.48.gate_proj", "model.layers.87.mlp.experts.49.gate_proj", "model.layers.87.mlp.experts.50.gate_proj", "model.layers.87.mlp.experts.51.gate_proj", "model.layers.87.mlp.experts.52.gate_proj", "model.layers.87.mlp.experts.53.gate_proj", "model.layers.87.mlp.experts.54.gate_proj", "model.layers.87.mlp.experts.55.gate_proj", "model.layers.87.mlp.experts.56.gate_proj", "model.layers.87.mlp.experts.57.gate_proj", "model.layers.87.mlp.experts.58.gate_proj", "model.layers.87.mlp.experts.59.gate_proj", "model.layers.87.mlp.experts.60.gate_proj", "model.layers.87.mlp.experts.61.gate_proj", "model.layers.87.mlp.experts.62.gate_proj", "model.layers.87.mlp.experts.63.gate_proj", "model.layers.87.mlp.experts.64.gate_proj", "model.layers.87.mlp.experts.65.gate_proj", "model.layers.87.mlp.experts.66.gate_proj", "model.layers.87.mlp.experts.67.gate_proj", "model.layers.87.mlp.experts.68.gate_proj", "model.layers.87.mlp.experts.69.gate_proj", "model.layers.87.mlp.experts.70.gate_proj", "model.layers.87.mlp.experts.71.gate_proj", "model.layers.87.mlp.experts.72.gate_proj", "model.layers.87.mlp.experts.73.gate_proj", "model.layers.87.mlp.experts.74.gate_proj", "model.layers.87.mlp.experts.75.gate_proj", "model.layers.87.mlp.experts.76.gate_proj", "model.layers.87.mlp.experts.77.gate_proj", "model.layers.87.mlp.experts.78.gate_proj", "model.layers.87.mlp.experts.79.gate_proj", "model.layers.87.mlp.experts.80.gate_proj", "model.layers.87.mlp.experts.81.gate_proj", "model.layers.87.mlp.experts.82.gate_proj", "model.layers.87.mlp.experts.83.gate_proj", "model.layers.87.mlp.experts.84.gate_proj", "model.layers.87.mlp.experts.85.gate_proj", "model.layers.87.mlp.experts.86.gate_proj", "model.layers.87.mlp.experts.87.gate_proj", "model.layers.87.mlp.experts.88.gate_proj", "model.layers.87.mlp.experts.89.gate_proj", "model.layers.87.mlp.experts.90.gate_proj", "model.layers.87.mlp.experts.91.gate_proj", "model.layers.87.mlp.experts.92.gate_proj", "model.layers.87.mlp.experts.93.gate_proj", "model.layers.87.mlp.experts.94.gate_proj", "model.layers.87.mlp.experts.95.gate_proj", "model.layers.87.mlp.experts.96.gate_proj", "model.layers.87.mlp.experts.97.gate_proj", "model.layers.87.mlp.experts.98.gate_proj", "model.layers.87.mlp.experts.99.gate_proj", "model.layers.87.mlp.experts.100.gate_proj", "model.layers.87.mlp.experts.101.gate_proj", "model.layers.87.mlp.experts.102.gate_proj", "model.layers.87.mlp.experts.103.gate_proj", "model.layers.87.mlp.experts.104.gate_proj", "model.layers.87.mlp.experts.105.gate_proj", "model.layers.87.mlp.experts.106.gate_proj", "model.layers.87.mlp.experts.107.gate_proj", "model.layers.87.mlp.experts.108.gate_proj", "model.layers.87.mlp.experts.109.gate_proj", "model.layers.87.mlp.experts.110.gate_proj", "model.layers.87.mlp.experts.111.gate_proj", "model.layers.87.mlp.experts.112.gate_proj", "model.layers.87.mlp.experts.113.gate_proj", "model.layers.87.mlp.experts.114.gate_proj", "model.layers.87.mlp.experts.115.gate_proj", "model.layers.87.mlp.experts.116.gate_proj", "model.layers.87.mlp.experts.117.gate_proj", "model.layers.87.mlp.experts.118.gate_proj", "model.layers.87.mlp.experts.119.gate_proj", "model.layers.87.mlp.experts.120.gate_proj", "model.layers.87.mlp.experts.121.gate_proj", "model.layers.87.mlp.experts.122.gate_proj", "model.layers.87.mlp.experts.123.gate_proj", "model.layers.87.mlp.experts.124.gate_proj", "model.layers.87.mlp.experts.125.gate_proj", "model.layers.87.mlp.experts.126.gate_proj", "model.layers.87.mlp.experts.127.gate_proj", "model.layers.87.mlp.experts.128.gate_proj", "model.layers.87.mlp.experts.129.gate_proj", "model.layers.87.mlp.experts.130.gate_proj", "model.layers.87.mlp.experts.131.gate_proj", "model.layers.87.mlp.experts.132.gate_proj", "model.layers.87.mlp.experts.133.gate_proj", "model.layers.87.mlp.experts.134.gate_proj", "model.layers.87.mlp.experts.135.gate_proj", "model.layers.87.mlp.experts.136.gate_proj", "model.layers.87.mlp.experts.137.gate_proj", "model.layers.87.mlp.experts.138.gate_proj", "model.layers.87.mlp.experts.139.gate_proj", "model.layers.87.mlp.experts.140.gate_proj", "model.layers.87.mlp.experts.141.gate_proj", "model.layers.87.mlp.experts.142.gate_proj", "model.layers.87.mlp.experts.143.gate_proj", "model.layers.87.mlp.experts.144.gate_proj", "model.layers.87.mlp.experts.145.gate_proj", "model.layers.87.mlp.experts.146.gate_proj", "model.layers.87.mlp.experts.147.gate_proj", "model.layers.87.mlp.experts.148.gate_proj", "model.layers.87.mlp.experts.149.gate_proj", "model.layers.87.mlp.experts.150.gate_proj", "model.layers.87.mlp.experts.151.gate_proj", "model.layers.87.mlp.experts.152.gate_proj", "model.layers.87.mlp.experts.153.gate_proj", "model.layers.87.mlp.experts.154.gate_proj", "model.layers.87.mlp.experts.155.gate_proj", "model.layers.87.mlp.experts.156.gate_proj", "model.layers.87.mlp.experts.157.gate_proj", "model.layers.87.mlp.experts.158.gate_proj", "model.layers.87.mlp.experts.159.gate_proj", "model.layers.87.mlp.experts.0.up_proj", "model.layers.87.mlp.experts.1.up_proj", "model.layers.87.mlp.experts.2.up_proj", "model.layers.87.mlp.experts.3.up_proj", "model.layers.87.mlp.experts.4.up_proj", "model.layers.87.mlp.experts.5.up_proj", "model.layers.87.mlp.experts.6.up_proj", "model.layers.87.mlp.experts.7.up_proj", "model.layers.87.mlp.experts.8.up_proj", "model.layers.87.mlp.experts.9.up_proj", "model.layers.87.mlp.experts.10.up_proj", "model.layers.87.mlp.experts.11.up_proj", "model.layers.87.mlp.experts.12.up_proj", "model.layers.87.mlp.experts.13.up_proj", "model.layers.87.mlp.experts.14.up_proj", "model.layers.87.mlp.experts.15.up_proj", "model.layers.87.mlp.experts.16.up_proj", "model.layers.87.mlp.experts.17.up_proj", "model.layers.87.mlp.experts.18.up_proj", "model.layers.87.mlp.experts.19.up_proj", "model.layers.87.mlp.experts.20.up_proj", "model.layers.87.mlp.experts.21.up_proj", "model.layers.87.mlp.experts.22.up_proj", "model.layers.87.mlp.experts.23.up_proj", "model.layers.87.mlp.experts.24.up_proj", "model.layers.87.mlp.experts.25.up_proj", "model.layers.87.mlp.experts.26.up_proj", "model.layers.87.mlp.experts.27.up_proj", "model.layers.87.mlp.experts.28.up_proj", "model.layers.87.mlp.experts.29.up_proj", "model.layers.87.mlp.experts.30.up_proj", "model.layers.87.mlp.experts.31.up_proj", "model.layers.87.mlp.experts.32.up_proj", "model.layers.87.mlp.experts.33.up_proj", "model.layers.87.mlp.experts.34.up_proj", "model.layers.87.mlp.experts.35.up_proj", "model.layers.87.mlp.experts.36.up_proj", "model.layers.87.mlp.experts.37.up_proj", "model.layers.87.mlp.experts.38.up_proj", "model.layers.87.mlp.experts.39.up_proj", "model.layers.87.mlp.experts.40.up_proj", "model.layers.87.mlp.experts.41.up_proj", "model.layers.87.mlp.experts.42.up_proj", "model.layers.87.mlp.experts.43.up_proj", "model.layers.87.mlp.experts.44.up_proj", "model.layers.87.mlp.experts.45.up_proj", "model.layers.87.mlp.experts.46.up_proj", "model.layers.87.mlp.experts.47.up_proj", "model.layers.87.mlp.experts.48.up_proj", "model.layers.87.mlp.experts.49.up_proj", "model.layers.87.mlp.experts.50.up_proj", "model.layers.87.mlp.experts.51.up_proj", "model.layers.87.mlp.experts.52.up_proj", "model.layers.87.mlp.experts.53.up_proj", "model.layers.87.mlp.experts.54.up_proj", "model.layers.87.mlp.experts.55.up_proj", "model.layers.87.mlp.experts.56.up_proj", "model.layers.87.mlp.experts.57.up_proj", "model.layers.87.mlp.experts.58.up_proj", "model.layers.87.mlp.experts.59.up_proj", "model.layers.87.mlp.experts.60.up_proj", "model.layers.87.mlp.experts.61.up_proj", "model.layers.87.mlp.experts.62.up_proj", "model.layers.87.mlp.experts.63.up_proj", "model.layers.87.mlp.experts.64.up_proj", "model.layers.87.mlp.experts.65.up_proj", "model.layers.87.mlp.experts.66.up_proj", "model.layers.87.mlp.experts.67.up_proj", "model.layers.87.mlp.experts.68.up_proj", "model.layers.87.mlp.experts.69.up_proj", "model.layers.87.mlp.experts.70.up_proj", "model.layers.87.mlp.experts.71.up_proj", "model.layers.87.mlp.experts.72.up_proj", "model.layers.87.mlp.experts.73.up_proj", "model.layers.87.mlp.experts.74.up_proj", "model.layers.87.mlp.experts.75.up_proj", "model.layers.87.mlp.experts.76.up_proj", "model.layers.87.mlp.experts.77.up_proj", "model.layers.87.mlp.experts.78.up_proj", "model.layers.87.mlp.experts.79.up_proj", "model.layers.87.mlp.experts.80.up_proj", "model.layers.87.mlp.experts.81.up_proj", "model.layers.87.mlp.experts.82.up_proj", "model.layers.87.mlp.experts.83.up_proj", "model.layers.87.mlp.experts.84.up_proj", "model.layers.87.mlp.experts.85.up_proj", "model.layers.87.mlp.experts.86.up_proj", "model.layers.87.mlp.experts.87.up_proj", "model.layers.87.mlp.experts.88.up_proj", "model.layers.87.mlp.experts.89.up_proj", "model.layers.87.mlp.experts.90.up_proj", "model.layers.87.mlp.experts.91.up_proj", "model.layers.87.mlp.experts.92.up_proj", "model.layers.87.mlp.experts.93.up_proj", "model.layers.87.mlp.experts.94.up_proj", "model.layers.87.mlp.experts.95.up_proj", "model.layers.87.mlp.experts.96.up_proj", "model.layers.87.mlp.experts.97.up_proj", "model.layers.87.mlp.experts.98.up_proj", "model.layers.87.mlp.experts.99.up_proj", "model.layers.87.mlp.experts.100.up_proj", "model.layers.87.mlp.experts.101.up_proj", "model.layers.87.mlp.experts.102.up_proj", "model.layers.87.mlp.experts.103.up_proj", "model.layers.87.mlp.experts.104.up_proj", "model.layers.87.mlp.experts.105.up_proj", "model.layers.87.mlp.experts.106.up_proj", "model.layers.87.mlp.experts.107.up_proj", "model.layers.87.mlp.experts.108.up_proj", "model.layers.87.mlp.experts.109.up_proj", "model.layers.87.mlp.experts.110.up_proj", "model.layers.87.mlp.experts.111.up_proj", "model.layers.87.mlp.experts.112.up_proj", "model.layers.87.mlp.experts.113.up_proj", "model.layers.87.mlp.experts.114.up_proj", "model.layers.87.mlp.experts.115.up_proj", "model.layers.87.mlp.experts.116.up_proj", "model.layers.87.mlp.experts.117.up_proj", "model.layers.87.mlp.experts.118.up_proj", "model.layers.87.mlp.experts.119.up_proj", "model.layers.87.mlp.experts.120.up_proj", "model.layers.87.mlp.experts.121.up_proj", "model.layers.87.mlp.experts.122.up_proj", "model.layers.87.mlp.experts.123.up_proj", "model.layers.87.mlp.experts.124.up_proj", "model.layers.87.mlp.experts.125.up_proj", "model.layers.87.mlp.experts.126.up_proj", "model.layers.87.mlp.experts.127.up_proj", "model.layers.87.mlp.experts.128.up_proj", "model.layers.87.mlp.experts.129.up_proj", "model.layers.87.mlp.experts.130.up_proj", "model.layers.87.mlp.experts.131.up_proj", "model.layers.87.mlp.experts.132.up_proj", "model.layers.87.mlp.experts.133.up_proj", "model.layers.87.mlp.experts.134.up_proj", "model.layers.87.mlp.experts.135.up_proj", "model.layers.87.mlp.experts.136.up_proj", "model.layers.87.mlp.experts.137.up_proj", "model.layers.87.mlp.experts.138.up_proj", "model.layers.87.mlp.experts.139.up_proj", "model.layers.87.mlp.experts.140.up_proj", "model.layers.87.mlp.experts.141.up_proj", "model.layers.87.mlp.experts.142.up_proj", "model.layers.87.mlp.experts.143.up_proj", "model.layers.87.mlp.experts.144.up_proj", "model.layers.87.mlp.experts.145.up_proj", "model.layers.87.mlp.experts.146.up_proj", "model.layers.87.mlp.experts.147.up_proj", "model.layers.87.mlp.experts.148.up_proj", "model.layers.87.mlp.experts.149.up_proj", "model.layers.87.mlp.experts.150.up_proj", "model.layers.87.mlp.experts.151.up_proj", "model.layers.87.mlp.experts.152.up_proj", "model.layers.87.mlp.experts.153.up_proj", "model.layers.87.mlp.experts.154.up_proj", "model.layers.87.mlp.experts.155.up_proj", "model.layers.87.mlp.experts.156.up_proj", "model.layers.87.mlp.experts.157.up_proj", "model.layers.87.mlp.experts.158.up_proj", "model.layers.87.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -9.883521124720226e-06, "dbits": 2516582400 }, { "dkld": -1.3417983427643082e-05, "dbits": 5033164800 } ] }, { "idx": 524, "layers": [ "model.layers.87.mlp.experts.0.down_proj", "model.layers.87.mlp.experts.1.down_proj", "model.layers.87.mlp.experts.2.down_proj", "model.layers.87.mlp.experts.3.down_proj", "model.layers.87.mlp.experts.4.down_proj", "model.layers.87.mlp.experts.5.down_proj", "model.layers.87.mlp.experts.6.down_proj", "model.layers.87.mlp.experts.7.down_proj", "model.layers.87.mlp.experts.8.down_proj", "model.layers.87.mlp.experts.9.down_proj", "model.layers.87.mlp.experts.10.down_proj", "model.layers.87.mlp.experts.11.down_proj", "model.layers.87.mlp.experts.12.down_proj", "model.layers.87.mlp.experts.13.down_proj", "model.layers.87.mlp.experts.14.down_proj", "model.layers.87.mlp.experts.15.down_proj", "model.layers.87.mlp.experts.16.down_proj", "model.layers.87.mlp.experts.17.down_proj", "model.layers.87.mlp.experts.18.down_proj", "model.layers.87.mlp.experts.19.down_proj", "model.layers.87.mlp.experts.20.down_proj", "model.layers.87.mlp.experts.21.down_proj", "model.layers.87.mlp.experts.22.down_proj", "model.layers.87.mlp.experts.23.down_proj", "model.layers.87.mlp.experts.24.down_proj", "model.layers.87.mlp.experts.25.down_proj", "model.layers.87.mlp.experts.26.down_proj", "model.layers.87.mlp.experts.27.down_proj", "model.layers.87.mlp.experts.28.down_proj", "model.layers.87.mlp.experts.29.down_proj", "model.layers.87.mlp.experts.30.down_proj", "model.layers.87.mlp.experts.31.down_proj", "model.layers.87.mlp.experts.32.down_proj", "model.layers.87.mlp.experts.33.down_proj", "model.layers.87.mlp.experts.34.down_proj", "model.layers.87.mlp.experts.35.down_proj", "model.layers.87.mlp.experts.36.down_proj", "model.layers.87.mlp.experts.37.down_proj", "model.layers.87.mlp.experts.38.down_proj", "model.layers.87.mlp.experts.39.down_proj", "model.layers.87.mlp.experts.40.down_proj", "model.layers.87.mlp.experts.41.down_proj", "model.layers.87.mlp.experts.42.down_proj", "model.layers.87.mlp.experts.43.down_proj", "model.layers.87.mlp.experts.44.down_proj", "model.layers.87.mlp.experts.45.down_proj", "model.layers.87.mlp.experts.46.down_proj", "model.layers.87.mlp.experts.47.down_proj", "model.layers.87.mlp.experts.48.down_proj", "model.layers.87.mlp.experts.49.down_proj", "model.layers.87.mlp.experts.50.down_proj", "model.layers.87.mlp.experts.51.down_proj", "model.layers.87.mlp.experts.52.down_proj", "model.layers.87.mlp.experts.53.down_proj", "model.layers.87.mlp.experts.54.down_proj", "model.layers.87.mlp.experts.55.down_proj", "model.layers.87.mlp.experts.56.down_proj", "model.layers.87.mlp.experts.57.down_proj", "model.layers.87.mlp.experts.58.down_proj", "model.layers.87.mlp.experts.59.down_proj", "model.layers.87.mlp.experts.60.down_proj", "model.layers.87.mlp.experts.61.down_proj", "model.layers.87.mlp.experts.62.down_proj", "model.layers.87.mlp.experts.63.down_proj", "model.layers.87.mlp.experts.64.down_proj", "model.layers.87.mlp.experts.65.down_proj", "model.layers.87.mlp.experts.66.down_proj", "model.layers.87.mlp.experts.67.down_proj", "model.layers.87.mlp.experts.68.down_proj", "model.layers.87.mlp.experts.69.down_proj", "model.layers.87.mlp.experts.70.down_proj", "model.layers.87.mlp.experts.71.down_proj", "model.layers.87.mlp.experts.72.down_proj", "model.layers.87.mlp.experts.73.down_proj", "model.layers.87.mlp.experts.74.down_proj", "model.layers.87.mlp.experts.75.down_proj", "model.layers.87.mlp.experts.76.down_proj", "model.layers.87.mlp.experts.77.down_proj", "model.layers.87.mlp.experts.78.down_proj", "model.layers.87.mlp.experts.79.down_proj", "model.layers.87.mlp.experts.80.down_proj", "model.layers.87.mlp.experts.81.down_proj", "model.layers.87.mlp.experts.82.down_proj", "model.layers.87.mlp.experts.83.down_proj", "model.layers.87.mlp.experts.84.down_proj", "model.layers.87.mlp.experts.85.down_proj", "model.layers.87.mlp.experts.86.down_proj", "model.layers.87.mlp.experts.87.down_proj", "model.layers.87.mlp.experts.88.down_proj", "model.layers.87.mlp.experts.89.down_proj", "model.layers.87.mlp.experts.90.down_proj", "model.layers.87.mlp.experts.91.down_proj", "model.layers.87.mlp.experts.92.down_proj", "model.layers.87.mlp.experts.93.down_proj", "model.layers.87.mlp.experts.94.down_proj", "model.layers.87.mlp.experts.95.down_proj", "model.layers.87.mlp.experts.96.down_proj", "model.layers.87.mlp.experts.97.down_proj", "model.layers.87.mlp.experts.98.down_proj", "model.layers.87.mlp.experts.99.down_proj", "model.layers.87.mlp.experts.100.down_proj", "model.layers.87.mlp.experts.101.down_proj", "model.layers.87.mlp.experts.102.down_proj", "model.layers.87.mlp.experts.103.down_proj", "model.layers.87.mlp.experts.104.down_proj", "model.layers.87.mlp.experts.105.down_proj", "model.layers.87.mlp.experts.106.down_proj", "model.layers.87.mlp.experts.107.down_proj", "model.layers.87.mlp.experts.108.down_proj", "model.layers.87.mlp.experts.109.down_proj", "model.layers.87.mlp.experts.110.down_proj", "model.layers.87.mlp.experts.111.down_proj", "model.layers.87.mlp.experts.112.down_proj", "model.layers.87.mlp.experts.113.down_proj", "model.layers.87.mlp.experts.114.down_proj", "model.layers.87.mlp.experts.115.down_proj", "model.layers.87.mlp.experts.116.down_proj", "model.layers.87.mlp.experts.117.down_proj", "model.layers.87.mlp.experts.118.down_proj", "model.layers.87.mlp.experts.119.down_proj", "model.layers.87.mlp.experts.120.down_proj", "model.layers.87.mlp.experts.121.down_proj", "model.layers.87.mlp.experts.122.down_proj", "model.layers.87.mlp.experts.123.down_proj", "model.layers.87.mlp.experts.124.down_proj", "model.layers.87.mlp.experts.125.down_proj", "model.layers.87.mlp.experts.126.down_proj", "model.layers.87.mlp.experts.127.down_proj", "model.layers.87.mlp.experts.128.down_proj", "model.layers.87.mlp.experts.129.down_proj", "model.layers.87.mlp.experts.130.down_proj", "model.layers.87.mlp.experts.131.down_proj", "model.layers.87.mlp.experts.132.down_proj", "model.layers.87.mlp.experts.133.down_proj", "model.layers.87.mlp.experts.134.down_proj", "model.layers.87.mlp.experts.135.down_proj", "model.layers.87.mlp.experts.136.down_proj", "model.layers.87.mlp.experts.137.down_proj", "model.layers.87.mlp.experts.138.down_proj", "model.layers.87.mlp.experts.139.down_proj", "model.layers.87.mlp.experts.140.down_proj", "model.layers.87.mlp.experts.141.down_proj", "model.layers.87.mlp.experts.142.down_proj", "model.layers.87.mlp.experts.143.down_proj", "model.layers.87.mlp.experts.144.down_proj", "model.layers.87.mlp.experts.145.down_proj", "model.layers.87.mlp.experts.146.down_proj", "model.layers.87.mlp.experts.147.down_proj", "model.layers.87.mlp.experts.148.down_proj", "model.layers.87.mlp.experts.149.down_proj", "model.layers.87.mlp.experts.150.down_proj", "model.layers.87.mlp.experts.151.down_proj", "model.layers.87.mlp.experts.152.down_proj", "model.layers.87.mlp.experts.153.down_proj", "model.layers.87.mlp.experts.154.down_proj", "model.layers.87.mlp.experts.155.down_proj", "model.layers.87.mlp.experts.156.down_proj", "model.layers.87.mlp.experts.157.down_proj", "model.layers.87.mlp.experts.158.down_proj", "model.layers.87.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": -1.0930700227618217e-05, "dbits": 1258291200 }, { "dkld": -7.5419899076209496e-06, "dbits": 2516582400 } ] }, { "idx": 525, "layers": [ "model.layers.88.self_attn.q_proj" ], "candidates": [ { "dkld": -2.325801178812946e-05, "dbits": 62914560 }, { "dkld": -7.758755236862702e-06, "dbits": 125829120 } ] }, { "idx": 526, "layers": [ "model.layers.88.self_attn.k_proj", "model.layers.88.self_attn.v_proj" ], "candidates": [ { "dkld": 1.8760422244669395e-05, "dbits": 10485760 }, { "dkld": -2.5858962908386837e-05, "dbits": 20971520 } ] }, { "idx": 527, "layers": [ "model.layers.88.self_attn.o_proj" ], "candidates": [ { "dkld": -4.794327542185714e-05, "dbits": 62914560 }, { "dkld": -4.2153336107729825e-05, "dbits": 125829120 } ] }, { "idx": 528, "layers": [ "model.layers.88.mlp.shared_experts.gate_proj", "model.layers.88.mlp.shared_experts.up_proj", "model.layers.88.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -1.2368429452180862e-05, "dbits": 23592960 }, { "dkld": -3.0140695162116787e-05, "dbits": 47185920 } ] }, { "idx": 529, "layers": [ "model.layers.88.mlp.experts.0.gate_proj", "model.layers.88.mlp.experts.1.gate_proj", "model.layers.88.mlp.experts.2.gate_proj", "model.layers.88.mlp.experts.3.gate_proj", "model.layers.88.mlp.experts.4.gate_proj", "model.layers.88.mlp.experts.5.gate_proj", "model.layers.88.mlp.experts.6.gate_proj", "model.layers.88.mlp.experts.7.gate_proj", "model.layers.88.mlp.experts.8.gate_proj", "model.layers.88.mlp.experts.9.gate_proj", "model.layers.88.mlp.experts.10.gate_proj", "model.layers.88.mlp.experts.11.gate_proj", "model.layers.88.mlp.experts.12.gate_proj", "model.layers.88.mlp.experts.13.gate_proj", "model.layers.88.mlp.experts.14.gate_proj", "model.layers.88.mlp.experts.15.gate_proj", "model.layers.88.mlp.experts.16.gate_proj", "model.layers.88.mlp.experts.17.gate_proj", "model.layers.88.mlp.experts.18.gate_proj", "model.layers.88.mlp.experts.19.gate_proj", "model.layers.88.mlp.experts.20.gate_proj", "model.layers.88.mlp.experts.21.gate_proj", "model.layers.88.mlp.experts.22.gate_proj", "model.layers.88.mlp.experts.23.gate_proj", "model.layers.88.mlp.experts.24.gate_proj", "model.layers.88.mlp.experts.25.gate_proj", "model.layers.88.mlp.experts.26.gate_proj", "model.layers.88.mlp.experts.27.gate_proj", "model.layers.88.mlp.experts.28.gate_proj", "model.layers.88.mlp.experts.29.gate_proj", "model.layers.88.mlp.experts.30.gate_proj", "model.layers.88.mlp.experts.31.gate_proj", "model.layers.88.mlp.experts.32.gate_proj", "model.layers.88.mlp.experts.33.gate_proj", "model.layers.88.mlp.experts.34.gate_proj", "model.layers.88.mlp.experts.35.gate_proj", "model.layers.88.mlp.experts.36.gate_proj", "model.layers.88.mlp.experts.37.gate_proj", "model.layers.88.mlp.experts.38.gate_proj", "model.layers.88.mlp.experts.39.gate_proj", "model.layers.88.mlp.experts.40.gate_proj", "model.layers.88.mlp.experts.41.gate_proj", "model.layers.88.mlp.experts.42.gate_proj", "model.layers.88.mlp.experts.43.gate_proj", "model.layers.88.mlp.experts.44.gate_proj", "model.layers.88.mlp.experts.45.gate_proj", "model.layers.88.mlp.experts.46.gate_proj", "model.layers.88.mlp.experts.47.gate_proj", "model.layers.88.mlp.experts.48.gate_proj", "model.layers.88.mlp.experts.49.gate_proj", "model.layers.88.mlp.experts.50.gate_proj", "model.layers.88.mlp.experts.51.gate_proj", "model.layers.88.mlp.experts.52.gate_proj", "model.layers.88.mlp.experts.53.gate_proj", "model.layers.88.mlp.experts.54.gate_proj", "model.layers.88.mlp.experts.55.gate_proj", "model.layers.88.mlp.experts.56.gate_proj", "model.layers.88.mlp.experts.57.gate_proj", "model.layers.88.mlp.experts.58.gate_proj", "model.layers.88.mlp.experts.59.gate_proj", "model.layers.88.mlp.experts.60.gate_proj", "model.layers.88.mlp.experts.61.gate_proj", "model.layers.88.mlp.experts.62.gate_proj", "model.layers.88.mlp.experts.63.gate_proj", "model.layers.88.mlp.experts.64.gate_proj", "model.layers.88.mlp.experts.65.gate_proj", "model.layers.88.mlp.experts.66.gate_proj", "model.layers.88.mlp.experts.67.gate_proj", "model.layers.88.mlp.experts.68.gate_proj", "model.layers.88.mlp.experts.69.gate_proj", "model.layers.88.mlp.experts.70.gate_proj", "model.layers.88.mlp.experts.71.gate_proj", "model.layers.88.mlp.experts.72.gate_proj", "model.layers.88.mlp.experts.73.gate_proj", "model.layers.88.mlp.experts.74.gate_proj", "model.layers.88.mlp.experts.75.gate_proj", "model.layers.88.mlp.experts.76.gate_proj", "model.layers.88.mlp.experts.77.gate_proj", "model.layers.88.mlp.experts.78.gate_proj", "model.layers.88.mlp.experts.79.gate_proj", "model.layers.88.mlp.experts.80.gate_proj", "model.layers.88.mlp.experts.81.gate_proj", "model.layers.88.mlp.experts.82.gate_proj", "model.layers.88.mlp.experts.83.gate_proj", "model.layers.88.mlp.experts.84.gate_proj", "model.layers.88.mlp.experts.85.gate_proj", "model.layers.88.mlp.experts.86.gate_proj", "model.layers.88.mlp.experts.87.gate_proj", "model.layers.88.mlp.experts.88.gate_proj", "model.layers.88.mlp.experts.89.gate_proj", "model.layers.88.mlp.experts.90.gate_proj", "model.layers.88.mlp.experts.91.gate_proj", "model.layers.88.mlp.experts.92.gate_proj", "model.layers.88.mlp.experts.93.gate_proj", "model.layers.88.mlp.experts.94.gate_proj", "model.layers.88.mlp.experts.95.gate_proj", "model.layers.88.mlp.experts.96.gate_proj", "model.layers.88.mlp.experts.97.gate_proj", "model.layers.88.mlp.experts.98.gate_proj", "model.layers.88.mlp.experts.99.gate_proj", "model.layers.88.mlp.experts.100.gate_proj", "model.layers.88.mlp.experts.101.gate_proj", "model.layers.88.mlp.experts.102.gate_proj", "model.layers.88.mlp.experts.103.gate_proj", "model.layers.88.mlp.experts.104.gate_proj", "model.layers.88.mlp.experts.105.gate_proj", "model.layers.88.mlp.experts.106.gate_proj", "model.layers.88.mlp.experts.107.gate_proj", "model.layers.88.mlp.experts.108.gate_proj", "model.layers.88.mlp.experts.109.gate_proj", "model.layers.88.mlp.experts.110.gate_proj", "model.layers.88.mlp.experts.111.gate_proj", "model.layers.88.mlp.experts.112.gate_proj", "model.layers.88.mlp.experts.113.gate_proj", "model.layers.88.mlp.experts.114.gate_proj", "model.layers.88.mlp.experts.115.gate_proj", "model.layers.88.mlp.experts.116.gate_proj", "model.layers.88.mlp.experts.117.gate_proj", "model.layers.88.mlp.experts.118.gate_proj", "model.layers.88.mlp.experts.119.gate_proj", "model.layers.88.mlp.experts.120.gate_proj", "model.layers.88.mlp.experts.121.gate_proj", "model.layers.88.mlp.experts.122.gate_proj", "model.layers.88.mlp.experts.123.gate_proj", "model.layers.88.mlp.experts.124.gate_proj", "model.layers.88.mlp.experts.125.gate_proj", "model.layers.88.mlp.experts.126.gate_proj", "model.layers.88.mlp.experts.127.gate_proj", "model.layers.88.mlp.experts.128.gate_proj", "model.layers.88.mlp.experts.129.gate_proj", "model.layers.88.mlp.experts.130.gate_proj", "model.layers.88.mlp.experts.131.gate_proj", "model.layers.88.mlp.experts.132.gate_proj", "model.layers.88.mlp.experts.133.gate_proj", "model.layers.88.mlp.experts.134.gate_proj", "model.layers.88.mlp.experts.135.gate_proj", "model.layers.88.mlp.experts.136.gate_proj", "model.layers.88.mlp.experts.137.gate_proj", "model.layers.88.mlp.experts.138.gate_proj", "model.layers.88.mlp.experts.139.gate_proj", "model.layers.88.mlp.experts.140.gate_proj", "model.layers.88.mlp.experts.141.gate_proj", "model.layers.88.mlp.experts.142.gate_proj", "model.layers.88.mlp.experts.143.gate_proj", "model.layers.88.mlp.experts.144.gate_proj", "model.layers.88.mlp.experts.145.gate_proj", "model.layers.88.mlp.experts.146.gate_proj", "model.layers.88.mlp.experts.147.gate_proj", "model.layers.88.mlp.experts.148.gate_proj", "model.layers.88.mlp.experts.149.gate_proj", "model.layers.88.mlp.experts.150.gate_proj", "model.layers.88.mlp.experts.151.gate_proj", "model.layers.88.mlp.experts.152.gate_proj", "model.layers.88.mlp.experts.153.gate_proj", "model.layers.88.mlp.experts.154.gate_proj", "model.layers.88.mlp.experts.155.gate_proj", "model.layers.88.mlp.experts.156.gate_proj", "model.layers.88.mlp.experts.157.gate_proj", "model.layers.88.mlp.experts.158.gate_proj", "model.layers.88.mlp.experts.159.gate_proj", "model.layers.88.mlp.experts.0.up_proj", "model.layers.88.mlp.experts.1.up_proj", "model.layers.88.mlp.experts.2.up_proj", "model.layers.88.mlp.experts.3.up_proj", "model.layers.88.mlp.experts.4.up_proj", "model.layers.88.mlp.experts.5.up_proj", "model.layers.88.mlp.experts.6.up_proj", "model.layers.88.mlp.experts.7.up_proj", "model.layers.88.mlp.experts.8.up_proj", "model.layers.88.mlp.experts.9.up_proj", "model.layers.88.mlp.experts.10.up_proj", "model.layers.88.mlp.experts.11.up_proj", "model.layers.88.mlp.experts.12.up_proj", "model.layers.88.mlp.experts.13.up_proj", "model.layers.88.mlp.experts.14.up_proj", "model.layers.88.mlp.experts.15.up_proj", "model.layers.88.mlp.experts.16.up_proj", "model.layers.88.mlp.experts.17.up_proj", "model.layers.88.mlp.experts.18.up_proj", "model.layers.88.mlp.experts.19.up_proj", "model.layers.88.mlp.experts.20.up_proj", "model.layers.88.mlp.experts.21.up_proj", "model.layers.88.mlp.experts.22.up_proj", "model.layers.88.mlp.experts.23.up_proj", "model.layers.88.mlp.experts.24.up_proj", "model.layers.88.mlp.experts.25.up_proj", "model.layers.88.mlp.experts.26.up_proj", "model.layers.88.mlp.experts.27.up_proj", "model.layers.88.mlp.experts.28.up_proj", "model.layers.88.mlp.experts.29.up_proj", "model.layers.88.mlp.experts.30.up_proj", "model.layers.88.mlp.experts.31.up_proj", "model.layers.88.mlp.experts.32.up_proj", "model.layers.88.mlp.experts.33.up_proj", "model.layers.88.mlp.experts.34.up_proj", "model.layers.88.mlp.experts.35.up_proj", "model.layers.88.mlp.experts.36.up_proj", "model.layers.88.mlp.experts.37.up_proj", "model.layers.88.mlp.experts.38.up_proj", "model.layers.88.mlp.experts.39.up_proj", "model.layers.88.mlp.experts.40.up_proj", "model.layers.88.mlp.experts.41.up_proj", "model.layers.88.mlp.experts.42.up_proj", "model.layers.88.mlp.experts.43.up_proj", "model.layers.88.mlp.experts.44.up_proj", "model.layers.88.mlp.experts.45.up_proj", "model.layers.88.mlp.experts.46.up_proj", "model.layers.88.mlp.experts.47.up_proj", "model.layers.88.mlp.experts.48.up_proj", "model.layers.88.mlp.experts.49.up_proj", "model.layers.88.mlp.experts.50.up_proj", "model.layers.88.mlp.experts.51.up_proj", "model.layers.88.mlp.experts.52.up_proj", "model.layers.88.mlp.experts.53.up_proj", "model.layers.88.mlp.experts.54.up_proj", "model.layers.88.mlp.experts.55.up_proj", "model.layers.88.mlp.experts.56.up_proj", "model.layers.88.mlp.experts.57.up_proj", "model.layers.88.mlp.experts.58.up_proj", "model.layers.88.mlp.experts.59.up_proj", "model.layers.88.mlp.experts.60.up_proj", "model.layers.88.mlp.experts.61.up_proj", "model.layers.88.mlp.experts.62.up_proj", "model.layers.88.mlp.experts.63.up_proj", "model.layers.88.mlp.experts.64.up_proj", "model.layers.88.mlp.experts.65.up_proj", "model.layers.88.mlp.experts.66.up_proj", "model.layers.88.mlp.experts.67.up_proj", "model.layers.88.mlp.experts.68.up_proj", "model.layers.88.mlp.experts.69.up_proj", "model.layers.88.mlp.experts.70.up_proj", "model.layers.88.mlp.experts.71.up_proj", "model.layers.88.mlp.experts.72.up_proj", "model.layers.88.mlp.experts.73.up_proj", "model.layers.88.mlp.experts.74.up_proj", "model.layers.88.mlp.experts.75.up_proj", "model.layers.88.mlp.experts.76.up_proj", "model.layers.88.mlp.experts.77.up_proj", "model.layers.88.mlp.experts.78.up_proj", "model.layers.88.mlp.experts.79.up_proj", "model.layers.88.mlp.experts.80.up_proj", "model.layers.88.mlp.experts.81.up_proj", "model.layers.88.mlp.experts.82.up_proj", "model.layers.88.mlp.experts.83.up_proj", "model.layers.88.mlp.experts.84.up_proj", "model.layers.88.mlp.experts.85.up_proj", "model.layers.88.mlp.experts.86.up_proj", "model.layers.88.mlp.experts.87.up_proj", "model.layers.88.mlp.experts.88.up_proj", "model.layers.88.mlp.experts.89.up_proj", "model.layers.88.mlp.experts.90.up_proj", "model.layers.88.mlp.experts.91.up_proj", "model.layers.88.mlp.experts.92.up_proj", "model.layers.88.mlp.experts.93.up_proj", "model.layers.88.mlp.experts.94.up_proj", "model.layers.88.mlp.experts.95.up_proj", "model.layers.88.mlp.experts.96.up_proj", "model.layers.88.mlp.experts.97.up_proj", "model.layers.88.mlp.experts.98.up_proj", "model.layers.88.mlp.experts.99.up_proj", "model.layers.88.mlp.experts.100.up_proj", "model.layers.88.mlp.experts.101.up_proj", "model.layers.88.mlp.experts.102.up_proj", "model.layers.88.mlp.experts.103.up_proj", "model.layers.88.mlp.experts.104.up_proj", "model.layers.88.mlp.experts.105.up_proj", "model.layers.88.mlp.experts.106.up_proj", "model.layers.88.mlp.experts.107.up_proj", "model.layers.88.mlp.experts.108.up_proj", "model.layers.88.mlp.experts.109.up_proj", "model.layers.88.mlp.experts.110.up_proj", "model.layers.88.mlp.experts.111.up_proj", "model.layers.88.mlp.experts.112.up_proj", "model.layers.88.mlp.experts.113.up_proj", "model.layers.88.mlp.experts.114.up_proj", "model.layers.88.mlp.experts.115.up_proj", "model.layers.88.mlp.experts.116.up_proj", "model.layers.88.mlp.experts.117.up_proj", "model.layers.88.mlp.experts.118.up_proj", "model.layers.88.mlp.experts.119.up_proj", "model.layers.88.mlp.experts.120.up_proj", "model.layers.88.mlp.experts.121.up_proj", "model.layers.88.mlp.experts.122.up_proj", "model.layers.88.mlp.experts.123.up_proj", "model.layers.88.mlp.experts.124.up_proj", "model.layers.88.mlp.experts.125.up_proj", "model.layers.88.mlp.experts.126.up_proj", "model.layers.88.mlp.experts.127.up_proj", "model.layers.88.mlp.experts.128.up_proj", "model.layers.88.mlp.experts.129.up_proj", "model.layers.88.mlp.experts.130.up_proj", "model.layers.88.mlp.experts.131.up_proj", "model.layers.88.mlp.experts.132.up_proj", "model.layers.88.mlp.experts.133.up_proj", "model.layers.88.mlp.experts.134.up_proj", "model.layers.88.mlp.experts.135.up_proj", "model.layers.88.mlp.experts.136.up_proj", "model.layers.88.mlp.experts.137.up_proj", "model.layers.88.mlp.experts.138.up_proj", "model.layers.88.mlp.experts.139.up_proj", "model.layers.88.mlp.experts.140.up_proj", "model.layers.88.mlp.experts.141.up_proj", "model.layers.88.mlp.experts.142.up_proj", "model.layers.88.mlp.experts.143.up_proj", "model.layers.88.mlp.experts.144.up_proj", "model.layers.88.mlp.experts.145.up_proj", "model.layers.88.mlp.experts.146.up_proj", "model.layers.88.mlp.experts.147.up_proj", "model.layers.88.mlp.experts.148.up_proj", "model.layers.88.mlp.experts.149.up_proj", "model.layers.88.mlp.experts.150.up_proj", "model.layers.88.mlp.experts.151.up_proj", "model.layers.88.mlp.experts.152.up_proj", "model.layers.88.mlp.experts.153.up_proj", "model.layers.88.mlp.experts.154.up_proj", "model.layers.88.mlp.experts.155.up_proj", "model.layers.88.mlp.experts.156.up_proj", "model.layers.88.mlp.experts.157.up_proj", "model.layers.88.mlp.experts.158.up_proj", "model.layers.88.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -2.0379899069652985e-06, "dbits": 2516582400 }, { "dkld": -5.154148675501e-06, "dbits": 5033164800 } ] }, { "idx": 530, "layers": [ "model.layers.88.mlp.experts.0.down_proj", "model.layers.88.mlp.experts.1.down_proj", "model.layers.88.mlp.experts.2.down_proj", "model.layers.88.mlp.experts.3.down_proj", "model.layers.88.mlp.experts.4.down_proj", "model.layers.88.mlp.experts.5.down_proj", "model.layers.88.mlp.experts.6.down_proj", "model.layers.88.mlp.experts.7.down_proj", "model.layers.88.mlp.experts.8.down_proj", "model.layers.88.mlp.experts.9.down_proj", "model.layers.88.mlp.experts.10.down_proj", "model.layers.88.mlp.experts.11.down_proj", "model.layers.88.mlp.experts.12.down_proj", "model.layers.88.mlp.experts.13.down_proj", "model.layers.88.mlp.experts.14.down_proj", "model.layers.88.mlp.experts.15.down_proj", "model.layers.88.mlp.experts.16.down_proj", "model.layers.88.mlp.experts.17.down_proj", "model.layers.88.mlp.experts.18.down_proj", "model.layers.88.mlp.experts.19.down_proj", "model.layers.88.mlp.experts.20.down_proj", "model.layers.88.mlp.experts.21.down_proj", "model.layers.88.mlp.experts.22.down_proj", "model.layers.88.mlp.experts.23.down_proj", "model.layers.88.mlp.experts.24.down_proj", "model.layers.88.mlp.experts.25.down_proj", "model.layers.88.mlp.experts.26.down_proj", "model.layers.88.mlp.experts.27.down_proj", "model.layers.88.mlp.experts.28.down_proj", "model.layers.88.mlp.experts.29.down_proj", "model.layers.88.mlp.experts.30.down_proj", "model.layers.88.mlp.experts.31.down_proj", "model.layers.88.mlp.experts.32.down_proj", "model.layers.88.mlp.experts.33.down_proj", "model.layers.88.mlp.experts.34.down_proj", "model.layers.88.mlp.experts.35.down_proj", "model.layers.88.mlp.experts.36.down_proj", "model.layers.88.mlp.experts.37.down_proj", "model.layers.88.mlp.experts.38.down_proj", "model.layers.88.mlp.experts.39.down_proj", "model.layers.88.mlp.experts.40.down_proj", "model.layers.88.mlp.experts.41.down_proj", "model.layers.88.mlp.experts.42.down_proj", "model.layers.88.mlp.experts.43.down_proj", "model.layers.88.mlp.experts.44.down_proj", "model.layers.88.mlp.experts.45.down_proj", "model.layers.88.mlp.experts.46.down_proj", "model.layers.88.mlp.experts.47.down_proj", "model.layers.88.mlp.experts.48.down_proj", "model.layers.88.mlp.experts.49.down_proj", "model.layers.88.mlp.experts.50.down_proj", "model.layers.88.mlp.experts.51.down_proj", "model.layers.88.mlp.experts.52.down_proj", "model.layers.88.mlp.experts.53.down_proj", "model.layers.88.mlp.experts.54.down_proj", "model.layers.88.mlp.experts.55.down_proj", "model.layers.88.mlp.experts.56.down_proj", "model.layers.88.mlp.experts.57.down_proj", "model.layers.88.mlp.experts.58.down_proj", "model.layers.88.mlp.experts.59.down_proj", "model.layers.88.mlp.experts.60.down_proj", "model.layers.88.mlp.experts.61.down_proj", "model.layers.88.mlp.experts.62.down_proj", "model.layers.88.mlp.experts.63.down_proj", "model.layers.88.mlp.experts.64.down_proj", "model.layers.88.mlp.experts.65.down_proj", "model.layers.88.mlp.experts.66.down_proj", "model.layers.88.mlp.experts.67.down_proj", "model.layers.88.mlp.experts.68.down_proj", "model.layers.88.mlp.experts.69.down_proj", "model.layers.88.mlp.experts.70.down_proj", "model.layers.88.mlp.experts.71.down_proj", "model.layers.88.mlp.experts.72.down_proj", "model.layers.88.mlp.experts.73.down_proj", "model.layers.88.mlp.experts.74.down_proj", "model.layers.88.mlp.experts.75.down_proj", "model.layers.88.mlp.experts.76.down_proj", "model.layers.88.mlp.experts.77.down_proj", "model.layers.88.mlp.experts.78.down_proj", "model.layers.88.mlp.experts.79.down_proj", "model.layers.88.mlp.experts.80.down_proj", "model.layers.88.mlp.experts.81.down_proj", "model.layers.88.mlp.experts.82.down_proj", "model.layers.88.mlp.experts.83.down_proj", "model.layers.88.mlp.experts.84.down_proj", "model.layers.88.mlp.experts.85.down_proj", "model.layers.88.mlp.experts.86.down_proj", "model.layers.88.mlp.experts.87.down_proj", "model.layers.88.mlp.experts.88.down_proj", "model.layers.88.mlp.experts.89.down_proj", "model.layers.88.mlp.experts.90.down_proj", "model.layers.88.mlp.experts.91.down_proj", "model.layers.88.mlp.experts.92.down_proj", "model.layers.88.mlp.experts.93.down_proj", "model.layers.88.mlp.experts.94.down_proj", "model.layers.88.mlp.experts.95.down_proj", "model.layers.88.mlp.experts.96.down_proj", "model.layers.88.mlp.experts.97.down_proj", "model.layers.88.mlp.experts.98.down_proj", "model.layers.88.mlp.experts.99.down_proj", "model.layers.88.mlp.experts.100.down_proj", "model.layers.88.mlp.experts.101.down_proj", "model.layers.88.mlp.experts.102.down_proj", "model.layers.88.mlp.experts.103.down_proj", "model.layers.88.mlp.experts.104.down_proj", "model.layers.88.mlp.experts.105.down_proj", "model.layers.88.mlp.experts.106.down_proj", "model.layers.88.mlp.experts.107.down_proj", "model.layers.88.mlp.experts.108.down_proj", "model.layers.88.mlp.experts.109.down_proj", "model.layers.88.mlp.experts.110.down_proj", "model.layers.88.mlp.experts.111.down_proj", "model.layers.88.mlp.experts.112.down_proj", "model.layers.88.mlp.experts.113.down_proj", "model.layers.88.mlp.experts.114.down_proj", "model.layers.88.mlp.experts.115.down_proj", "model.layers.88.mlp.experts.116.down_proj", "model.layers.88.mlp.experts.117.down_proj", "model.layers.88.mlp.experts.118.down_proj", "model.layers.88.mlp.experts.119.down_proj", "model.layers.88.mlp.experts.120.down_proj", "model.layers.88.mlp.experts.121.down_proj", "model.layers.88.mlp.experts.122.down_proj", "model.layers.88.mlp.experts.123.down_proj", "model.layers.88.mlp.experts.124.down_proj", "model.layers.88.mlp.experts.125.down_proj", "model.layers.88.mlp.experts.126.down_proj", "model.layers.88.mlp.experts.127.down_proj", "model.layers.88.mlp.experts.128.down_proj", "model.layers.88.mlp.experts.129.down_proj", "model.layers.88.mlp.experts.130.down_proj", "model.layers.88.mlp.experts.131.down_proj", "model.layers.88.mlp.experts.132.down_proj", "model.layers.88.mlp.experts.133.down_proj", "model.layers.88.mlp.experts.134.down_proj", "model.layers.88.mlp.experts.135.down_proj", "model.layers.88.mlp.experts.136.down_proj", "model.layers.88.mlp.experts.137.down_proj", "model.layers.88.mlp.experts.138.down_proj", "model.layers.88.mlp.experts.139.down_proj", "model.layers.88.mlp.experts.140.down_proj", "model.layers.88.mlp.experts.141.down_proj", "model.layers.88.mlp.experts.142.down_proj", "model.layers.88.mlp.experts.143.down_proj", "model.layers.88.mlp.experts.144.down_proj", "model.layers.88.mlp.experts.145.down_proj", "model.layers.88.mlp.experts.146.down_proj", "model.layers.88.mlp.experts.147.down_proj", "model.layers.88.mlp.experts.148.down_proj", "model.layers.88.mlp.experts.149.down_proj", "model.layers.88.mlp.experts.150.down_proj", "model.layers.88.mlp.experts.151.down_proj", "model.layers.88.mlp.experts.152.down_proj", "model.layers.88.mlp.experts.153.down_proj", "model.layers.88.mlp.experts.154.down_proj", "model.layers.88.mlp.experts.155.down_proj", "model.layers.88.mlp.experts.156.down_proj", "model.layers.88.mlp.experts.157.down_proj", "model.layers.88.mlp.experts.158.down_proj", "model.layers.88.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 4.401896148920059e-06, "dbits": 1258291200 }, { "dkld": -2.0020874217149126e-06, "dbits": 2516582400 } ] }, { "idx": 531, "layers": [ "model.layers.89.self_attn.q_proj" ], "candidates": [ { "dkld": -3.999911714345182e-05, "dbits": 62914560 }, { "dkld": -4.436024464666774e-05, "dbits": 125829120 } ] }, { "idx": 532, "layers": [ "model.layers.89.self_attn.k_proj", "model.layers.89.self_attn.v_proj" ], "candidates": [ { "dkld": -9.884731844067574e-05, "dbits": 10485760 }, { "dkld": -7.799009326845373e-05, "dbits": 20971520 } ] }, { "idx": 533, "layers": [ "model.layers.89.self_attn.o_proj" ], "candidates": [ { "dkld": -1.8325750716030598e-05, "dbits": 62914560 }, { "dkld": -1.799701713025431e-05, "dbits": 125829120 } ] }, { "idx": 534, "layers": [ "model.layers.89.mlp.shared_experts.gate_proj", "model.layers.89.mlp.shared_experts.up_proj", "model.layers.89.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -3.620688803493942e-05, "dbits": 23592960 }, { "dkld": -5.639644805341924e-05, "dbits": 47185920 } ] }, { "idx": 535, "layers": [ "model.layers.89.mlp.experts.0.gate_proj", "model.layers.89.mlp.experts.1.gate_proj", "model.layers.89.mlp.experts.2.gate_proj", "model.layers.89.mlp.experts.3.gate_proj", "model.layers.89.mlp.experts.4.gate_proj", "model.layers.89.mlp.experts.5.gate_proj", "model.layers.89.mlp.experts.6.gate_proj", "model.layers.89.mlp.experts.7.gate_proj", "model.layers.89.mlp.experts.8.gate_proj", "model.layers.89.mlp.experts.9.gate_proj", "model.layers.89.mlp.experts.10.gate_proj", "model.layers.89.mlp.experts.11.gate_proj", "model.layers.89.mlp.experts.12.gate_proj", "model.layers.89.mlp.experts.13.gate_proj", "model.layers.89.mlp.experts.14.gate_proj", "model.layers.89.mlp.experts.15.gate_proj", "model.layers.89.mlp.experts.16.gate_proj", "model.layers.89.mlp.experts.17.gate_proj", "model.layers.89.mlp.experts.18.gate_proj", "model.layers.89.mlp.experts.19.gate_proj", "model.layers.89.mlp.experts.20.gate_proj", "model.layers.89.mlp.experts.21.gate_proj", "model.layers.89.mlp.experts.22.gate_proj", "model.layers.89.mlp.experts.23.gate_proj", "model.layers.89.mlp.experts.24.gate_proj", "model.layers.89.mlp.experts.25.gate_proj", "model.layers.89.mlp.experts.26.gate_proj", "model.layers.89.mlp.experts.27.gate_proj", "model.layers.89.mlp.experts.28.gate_proj", "model.layers.89.mlp.experts.29.gate_proj", "model.layers.89.mlp.experts.30.gate_proj", "model.layers.89.mlp.experts.31.gate_proj", "model.layers.89.mlp.experts.32.gate_proj", "model.layers.89.mlp.experts.33.gate_proj", "model.layers.89.mlp.experts.34.gate_proj", "model.layers.89.mlp.experts.35.gate_proj", "model.layers.89.mlp.experts.36.gate_proj", "model.layers.89.mlp.experts.37.gate_proj", "model.layers.89.mlp.experts.38.gate_proj", "model.layers.89.mlp.experts.39.gate_proj", "model.layers.89.mlp.experts.40.gate_proj", "model.layers.89.mlp.experts.41.gate_proj", "model.layers.89.mlp.experts.42.gate_proj", "model.layers.89.mlp.experts.43.gate_proj", "model.layers.89.mlp.experts.44.gate_proj", "model.layers.89.mlp.experts.45.gate_proj", "model.layers.89.mlp.experts.46.gate_proj", "model.layers.89.mlp.experts.47.gate_proj", "model.layers.89.mlp.experts.48.gate_proj", "model.layers.89.mlp.experts.49.gate_proj", "model.layers.89.mlp.experts.50.gate_proj", "model.layers.89.mlp.experts.51.gate_proj", "model.layers.89.mlp.experts.52.gate_proj", "model.layers.89.mlp.experts.53.gate_proj", "model.layers.89.mlp.experts.54.gate_proj", "model.layers.89.mlp.experts.55.gate_proj", "model.layers.89.mlp.experts.56.gate_proj", "model.layers.89.mlp.experts.57.gate_proj", "model.layers.89.mlp.experts.58.gate_proj", "model.layers.89.mlp.experts.59.gate_proj", "model.layers.89.mlp.experts.60.gate_proj", "model.layers.89.mlp.experts.61.gate_proj", "model.layers.89.mlp.experts.62.gate_proj", "model.layers.89.mlp.experts.63.gate_proj", "model.layers.89.mlp.experts.64.gate_proj", "model.layers.89.mlp.experts.65.gate_proj", "model.layers.89.mlp.experts.66.gate_proj", "model.layers.89.mlp.experts.67.gate_proj", "model.layers.89.mlp.experts.68.gate_proj", "model.layers.89.mlp.experts.69.gate_proj", "model.layers.89.mlp.experts.70.gate_proj", "model.layers.89.mlp.experts.71.gate_proj", "model.layers.89.mlp.experts.72.gate_proj", "model.layers.89.mlp.experts.73.gate_proj", "model.layers.89.mlp.experts.74.gate_proj", "model.layers.89.mlp.experts.75.gate_proj", "model.layers.89.mlp.experts.76.gate_proj", "model.layers.89.mlp.experts.77.gate_proj", "model.layers.89.mlp.experts.78.gate_proj", "model.layers.89.mlp.experts.79.gate_proj", "model.layers.89.mlp.experts.80.gate_proj", "model.layers.89.mlp.experts.81.gate_proj", "model.layers.89.mlp.experts.82.gate_proj", "model.layers.89.mlp.experts.83.gate_proj", "model.layers.89.mlp.experts.84.gate_proj", "model.layers.89.mlp.experts.85.gate_proj", "model.layers.89.mlp.experts.86.gate_proj", "model.layers.89.mlp.experts.87.gate_proj", "model.layers.89.mlp.experts.88.gate_proj", "model.layers.89.mlp.experts.89.gate_proj", "model.layers.89.mlp.experts.90.gate_proj", "model.layers.89.mlp.experts.91.gate_proj", "model.layers.89.mlp.experts.92.gate_proj", "model.layers.89.mlp.experts.93.gate_proj", "model.layers.89.mlp.experts.94.gate_proj", "model.layers.89.mlp.experts.95.gate_proj", "model.layers.89.mlp.experts.96.gate_proj", "model.layers.89.mlp.experts.97.gate_proj", "model.layers.89.mlp.experts.98.gate_proj", "model.layers.89.mlp.experts.99.gate_proj", "model.layers.89.mlp.experts.100.gate_proj", "model.layers.89.mlp.experts.101.gate_proj", "model.layers.89.mlp.experts.102.gate_proj", "model.layers.89.mlp.experts.103.gate_proj", "model.layers.89.mlp.experts.104.gate_proj", "model.layers.89.mlp.experts.105.gate_proj", "model.layers.89.mlp.experts.106.gate_proj", "model.layers.89.mlp.experts.107.gate_proj", "model.layers.89.mlp.experts.108.gate_proj", "model.layers.89.mlp.experts.109.gate_proj", "model.layers.89.mlp.experts.110.gate_proj", "model.layers.89.mlp.experts.111.gate_proj", "model.layers.89.mlp.experts.112.gate_proj", "model.layers.89.mlp.experts.113.gate_proj", "model.layers.89.mlp.experts.114.gate_proj", "model.layers.89.mlp.experts.115.gate_proj", "model.layers.89.mlp.experts.116.gate_proj", "model.layers.89.mlp.experts.117.gate_proj", "model.layers.89.mlp.experts.118.gate_proj", "model.layers.89.mlp.experts.119.gate_proj", "model.layers.89.mlp.experts.120.gate_proj", "model.layers.89.mlp.experts.121.gate_proj", "model.layers.89.mlp.experts.122.gate_proj", "model.layers.89.mlp.experts.123.gate_proj", "model.layers.89.mlp.experts.124.gate_proj", "model.layers.89.mlp.experts.125.gate_proj", "model.layers.89.mlp.experts.126.gate_proj", "model.layers.89.mlp.experts.127.gate_proj", "model.layers.89.mlp.experts.128.gate_proj", "model.layers.89.mlp.experts.129.gate_proj", "model.layers.89.mlp.experts.130.gate_proj", "model.layers.89.mlp.experts.131.gate_proj", "model.layers.89.mlp.experts.132.gate_proj", "model.layers.89.mlp.experts.133.gate_proj", "model.layers.89.mlp.experts.134.gate_proj", "model.layers.89.mlp.experts.135.gate_proj", "model.layers.89.mlp.experts.136.gate_proj", "model.layers.89.mlp.experts.137.gate_proj", "model.layers.89.mlp.experts.138.gate_proj", "model.layers.89.mlp.experts.139.gate_proj", "model.layers.89.mlp.experts.140.gate_proj", "model.layers.89.mlp.experts.141.gate_proj", "model.layers.89.mlp.experts.142.gate_proj", "model.layers.89.mlp.experts.143.gate_proj", "model.layers.89.mlp.experts.144.gate_proj", "model.layers.89.mlp.experts.145.gate_proj", "model.layers.89.mlp.experts.146.gate_proj", "model.layers.89.mlp.experts.147.gate_proj", "model.layers.89.mlp.experts.148.gate_proj", "model.layers.89.mlp.experts.149.gate_proj", "model.layers.89.mlp.experts.150.gate_proj", "model.layers.89.mlp.experts.151.gate_proj", "model.layers.89.mlp.experts.152.gate_proj", "model.layers.89.mlp.experts.153.gate_proj", "model.layers.89.mlp.experts.154.gate_proj", "model.layers.89.mlp.experts.155.gate_proj", "model.layers.89.mlp.experts.156.gate_proj", "model.layers.89.mlp.experts.157.gate_proj", "model.layers.89.mlp.experts.158.gate_proj", "model.layers.89.mlp.experts.159.gate_proj", "model.layers.89.mlp.experts.0.up_proj", "model.layers.89.mlp.experts.1.up_proj", "model.layers.89.mlp.experts.2.up_proj", "model.layers.89.mlp.experts.3.up_proj", "model.layers.89.mlp.experts.4.up_proj", "model.layers.89.mlp.experts.5.up_proj", "model.layers.89.mlp.experts.6.up_proj", "model.layers.89.mlp.experts.7.up_proj", "model.layers.89.mlp.experts.8.up_proj", "model.layers.89.mlp.experts.9.up_proj", "model.layers.89.mlp.experts.10.up_proj", "model.layers.89.mlp.experts.11.up_proj", "model.layers.89.mlp.experts.12.up_proj", "model.layers.89.mlp.experts.13.up_proj", "model.layers.89.mlp.experts.14.up_proj", "model.layers.89.mlp.experts.15.up_proj", "model.layers.89.mlp.experts.16.up_proj", "model.layers.89.mlp.experts.17.up_proj", "model.layers.89.mlp.experts.18.up_proj", "model.layers.89.mlp.experts.19.up_proj", "model.layers.89.mlp.experts.20.up_proj", "model.layers.89.mlp.experts.21.up_proj", "model.layers.89.mlp.experts.22.up_proj", "model.layers.89.mlp.experts.23.up_proj", "model.layers.89.mlp.experts.24.up_proj", "model.layers.89.mlp.experts.25.up_proj", "model.layers.89.mlp.experts.26.up_proj", "model.layers.89.mlp.experts.27.up_proj", "model.layers.89.mlp.experts.28.up_proj", "model.layers.89.mlp.experts.29.up_proj", "model.layers.89.mlp.experts.30.up_proj", "model.layers.89.mlp.experts.31.up_proj", "model.layers.89.mlp.experts.32.up_proj", "model.layers.89.mlp.experts.33.up_proj", "model.layers.89.mlp.experts.34.up_proj", "model.layers.89.mlp.experts.35.up_proj", "model.layers.89.mlp.experts.36.up_proj", "model.layers.89.mlp.experts.37.up_proj", "model.layers.89.mlp.experts.38.up_proj", "model.layers.89.mlp.experts.39.up_proj", "model.layers.89.mlp.experts.40.up_proj", "model.layers.89.mlp.experts.41.up_proj", "model.layers.89.mlp.experts.42.up_proj", "model.layers.89.mlp.experts.43.up_proj", "model.layers.89.mlp.experts.44.up_proj", "model.layers.89.mlp.experts.45.up_proj", "model.layers.89.mlp.experts.46.up_proj", "model.layers.89.mlp.experts.47.up_proj", "model.layers.89.mlp.experts.48.up_proj", "model.layers.89.mlp.experts.49.up_proj", "model.layers.89.mlp.experts.50.up_proj", "model.layers.89.mlp.experts.51.up_proj", "model.layers.89.mlp.experts.52.up_proj", "model.layers.89.mlp.experts.53.up_proj", "model.layers.89.mlp.experts.54.up_proj", "model.layers.89.mlp.experts.55.up_proj", "model.layers.89.mlp.experts.56.up_proj", "model.layers.89.mlp.experts.57.up_proj", "model.layers.89.mlp.experts.58.up_proj", "model.layers.89.mlp.experts.59.up_proj", "model.layers.89.mlp.experts.60.up_proj", "model.layers.89.mlp.experts.61.up_proj", "model.layers.89.mlp.experts.62.up_proj", "model.layers.89.mlp.experts.63.up_proj", "model.layers.89.mlp.experts.64.up_proj", "model.layers.89.mlp.experts.65.up_proj", "model.layers.89.mlp.experts.66.up_proj", "model.layers.89.mlp.experts.67.up_proj", "model.layers.89.mlp.experts.68.up_proj", "model.layers.89.mlp.experts.69.up_proj", "model.layers.89.mlp.experts.70.up_proj", "model.layers.89.mlp.experts.71.up_proj", "model.layers.89.mlp.experts.72.up_proj", "model.layers.89.mlp.experts.73.up_proj", "model.layers.89.mlp.experts.74.up_proj", "model.layers.89.mlp.experts.75.up_proj", "model.layers.89.mlp.experts.76.up_proj", "model.layers.89.mlp.experts.77.up_proj", "model.layers.89.mlp.experts.78.up_proj", "model.layers.89.mlp.experts.79.up_proj", "model.layers.89.mlp.experts.80.up_proj", "model.layers.89.mlp.experts.81.up_proj", "model.layers.89.mlp.experts.82.up_proj", "model.layers.89.mlp.experts.83.up_proj", "model.layers.89.mlp.experts.84.up_proj", "model.layers.89.mlp.experts.85.up_proj", "model.layers.89.mlp.experts.86.up_proj", "model.layers.89.mlp.experts.87.up_proj", "model.layers.89.mlp.experts.88.up_proj", "model.layers.89.mlp.experts.89.up_proj", "model.layers.89.mlp.experts.90.up_proj", "model.layers.89.mlp.experts.91.up_proj", "model.layers.89.mlp.experts.92.up_proj", "model.layers.89.mlp.experts.93.up_proj", "model.layers.89.mlp.experts.94.up_proj", "model.layers.89.mlp.experts.95.up_proj", "model.layers.89.mlp.experts.96.up_proj", "model.layers.89.mlp.experts.97.up_proj", "model.layers.89.mlp.experts.98.up_proj", "model.layers.89.mlp.experts.99.up_proj", "model.layers.89.mlp.experts.100.up_proj", "model.layers.89.mlp.experts.101.up_proj", "model.layers.89.mlp.experts.102.up_proj", "model.layers.89.mlp.experts.103.up_proj", "model.layers.89.mlp.experts.104.up_proj", "model.layers.89.mlp.experts.105.up_proj", "model.layers.89.mlp.experts.106.up_proj", "model.layers.89.mlp.experts.107.up_proj", "model.layers.89.mlp.experts.108.up_proj", "model.layers.89.mlp.experts.109.up_proj", "model.layers.89.mlp.experts.110.up_proj", "model.layers.89.mlp.experts.111.up_proj", "model.layers.89.mlp.experts.112.up_proj", "model.layers.89.mlp.experts.113.up_proj", "model.layers.89.mlp.experts.114.up_proj", "model.layers.89.mlp.experts.115.up_proj", "model.layers.89.mlp.experts.116.up_proj", "model.layers.89.mlp.experts.117.up_proj", "model.layers.89.mlp.experts.118.up_proj", "model.layers.89.mlp.experts.119.up_proj", "model.layers.89.mlp.experts.120.up_proj", "model.layers.89.mlp.experts.121.up_proj", "model.layers.89.mlp.experts.122.up_proj", "model.layers.89.mlp.experts.123.up_proj", "model.layers.89.mlp.experts.124.up_proj", "model.layers.89.mlp.experts.125.up_proj", "model.layers.89.mlp.experts.126.up_proj", "model.layers.89.mlp.experts.127.up_proj", "model.layers.89.mlp.experts.128.up_proj", "model.layers.89.mlp.experts.129.up_proj", "model.layers.89.mlp.experts.130.up_proj", "model.layers.89.mlp.experts.131.up_proj", "model.layers.89.mlp.experts.132.up_proj", "model.layers.89.mlp.experts.133.up_proj", "model.layers.89.mlp.experts.134.up_proj", "model.layers.89.mlp.experts.135.up_proj", "model.layers.89.mlp.experts.136.up_proj", "model.layers.89.mlp.experts.137.up_proj", "model.layers.89.mlp.experts.138.up_proj", "model.layers.89.mlp.experts.139.up_proj", "model.layers.89.mlp.experts.140.up_proj", "model.layers.89.mlp.experts.141.up_proj", "model.layers.89.mlp.experts.142.up_proj", "model.layers.89.mlp.experts.143.up_proj", "model.layers.89.mlp.experts.144.up_proj", "model.layers.89.mlp.experts.145.up_proj", "model.layers.89.mlp.experts.146.up_proj", "model.layers.89.mlp.experts.147.up_proj", "model.layers.89.mlp.experts.148.up_proj", "model.layers.89.mlp.experts.149.up_proj", "model.layers.89.mlp.experts.150.up_proj", "model.layers.89.mlp.experts.151.up_proj", "model.layers.89.mlp.experts.152.up_proj", "model.layers.89.mlp.experts.153.up_proj", "model.layers.89.mlp.experts.154.up_proj", "model.layers.89.mlp.experts.155.up_proj", "model.layers.89.mlp.experts.156.up_proj", "model.layers.89.mlp.experts.157.up_proj", "model.layers.89.mlp.experts.158.up_proj", "model.layers.89.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -3.0974391847845423e-06, "dbits": 2516582400 }, { "dkld": -4.713609814643166e-06, "dbits": 5033164800 } ] }, { "idx": 536, "layers": [ "model.layers.89.mlp.experts.0.down_proj", "model.layers.89.mlp.experts.1.down_proj", "model.layers.89.mlp.experts.2.down_proj", "model.layers.89.mlp.experts.3.down_proj", "model.layers.89.mlp.experts.4.down_proj", "model.layers.89.mlp.experts.5.down_proj", "model.layers.89.mlp.experts.6.down_proj", "model.layers.89.mlp.experts.7.down_proj", "model.layers.89.mlp.experts.8.down_proj", "model.layers.89.mlp.experts.9.down_proj", "model.layers.89.mlp.experts.10.down_proj", "model.layers.89.mlp.experts.11.down_proj", "model.layers.89.mlp.experts.12.down_proj", "model.layers.89.mlp.experts.13.down_proj", "model.layers.89.mlp.experts.14.down_proj", "model.layers.89.mlp.experts.15.down_proj", "model.layers.89.mlp.experts.16.down_proj", "model.layers.89.mlp.experts.17.down_proj", "model.layers.89.mlp.experts.18.down_proj", "model.layers.89.mlp.experts.19.down_proj", "model.layers.89.mlp.experts.20.down_proj", "model.layers.89.mlp.experts.21.down_proj", "model.layers.89.mlp.experts.22.down_proj", "model.layers.89.mlp.experts.23.down_proj", "model.layers.89.mlp.experts.24.down_proj", "model.layers.89.mlp.experts.25.down_proj", "model.layers.89.mlp.experts.26.down_proj", "model.layers.89.mlp.experts.27.down_proj", "model.layers.89.mlp.experts.28.down_proj", "model.layers.89.mlp.experts.29.down_proj", "model.layers.89.mlp.experts.30.down_proj", "model.layers.89.mlp.experts.31.down_proj", "model.layers.89.mlp.experts.32.down_proj", "model.layers.89.mlp.experts.33.down_proj", "model.layers.89.mlp.experts.34.down_proj", "model.layers.89.mlp.experts.35.down_proj", "model.layers.89.mlp.experts.36.down_proj", "model.layers.89.mlp.experts.37.down_proj", "model.layers.89.mlp.experts.38.down_proj", "model.layers.89.mlp.experts.39.down_proj", "model.layers.89.mlp.experts.40.down_proj", "model.layers.89.mlp.experts.41.down_proj", "model.layers.89.mlp.experts.42.down_proj", "model.layers.89.mlp.experts.43.down_proj", "model.layers.89.mlp.experts.44.down_proj", "model.layers.89.mlp.experts.45.down_proj", "model.layers.89.mlp.experts.46.down_proj", "model.layers.89.mlp.experts.47.down_proj", "model.layers.89.mlp.experts.48.down_proj", "model.layers.89.mlp.experts.49.down_proj", "model.layers.89.mlp.experts.50.down_proj", "model.layers.89.mlp.experts.51.down_proj", "model.layers.89.mlp.experts.52.down_proj", "model.layers.89.mlp.experts.53.down_proj", "model.layers.89.mlp.experts.54.down_proj", "model.layers.89.mlp.experts.55.down_proj", "model.layers.89.mlp.experts.56.down_proj", "model.layers.89.mlp.experts.57.down_proj", "model.layers.89.mlp.experts.58.down_proj", "model.layers.89.mlp.experts.59.down_proj", "model.layers.89.mlp.experts.60.down_proj", "model.layers.89.mlp.experts.61.down_proj", "model.layers.89.mlp.experts.62.down_proj", "model.layers.89.mlp.experts.63.down_proj", "model.layers.89.mlp.experts.64.down_proj", "model.layers.89.mlp.experts.65.down_proj", "model.layers.89.mlp.experts.66.down_proj", "model.layers.89.mlp.experts.67.down_proj", "model.layers.89.mlp.experts.68.down_proj", "model.layers.89.mlp.experts.69.down_proj", "model.layers.89.mlp.experts.70.down_proj", "model.layers.89.mlp.experts.71.down_proj", "model.layers.89.mlp.experts.72.down_proj", "model.layers.89.mlp.experts.73.down_proj", "model.layers.89.mlp.experts.74.down_proj", "model.layers.89.mlp.experts.75.down_proj", "model.layers.89.mlp.experts.76.down_proj", "model.layers.89.mlp.experts.77.down_proj", "model.layers.89.mlp.experts.78.down_proj", "model.layers.89.mlp.experts.79.down_proj", "model.layers.89.mlp.experts.80.down_proj", "model.layers.89.mlp.experts.81.down_proj", "model.layers.89.mlp.experts.82.down_proj", "model.layers.89.mlp.experts.83.down_proj", "model.layers.89.mlp.experts.84.down_proj", "model.layers.89.mlp.experts.85.down_proj", "model.layers.89.mlp.experts.86.down_proj", "model.layers.89.mlp.experts.87.down_proj", "model.layers.89.mlp.experts.88.down_proj", "model.layers.89.mlp.experts.89.down_proj", "model.layers.89.mlp.experts.90.down_proj", "model.layers.89.mlp.experts.91.down_proj", "model.layers.89.mlp.experts.92.down_proj", "model.layers.89.mlp.experts.93.down_proj", "model.layers.89.mlp.experts.94.down_proj", "model.layers.89.mlp.experts.95.down_proj", "model.layers.89.mlp.experts.96.down_proj", "model.layers.89.mlp.experts.97.down_proj", "model.layers.89.mlp.experts.98.down_proj", "model.layers.89.mlp.experts.99.down_proj", "model.layers.89.mlp.experts.100.down_proj", "model.layers.89.mlp.experts.101.down_proj", "model.layers.89.mlp.experts.102.down_proj", "model.layers.89.mlp.experts.103.down_proj", "model.layers.89.mlp.experts.104.down_proj", "model.layers.89.mlp.experts.105.down_proj", "model.layers.89.mlp.experts.106.down_proj", "model.layers.89.mlp.experts.107.down_proj", "model.layers.89.mlp.experts.108.down_proj", "model.layers.89.mlp.experts.109.down_proj", "model.layers.89.mlp.experts.110.down_proj", "model.layers.89.mlp.experts.111.down_proj", "model.layers.89.mlp.experts.112.down_proj", "model.layers.89.mlp.experts.113.down_proj", "model.layers.89.mlp.experts.114.down_proj", "model.layers.89.mlp.experts.115.down_proj", "model.layers.89.mlp.experts.116.down_proj", "model.layers.89.mlp.experts.117.down_proj", "model.layers.89.mlp.experts.118.down_proj", "model.layers.89.mlp.experts.119.down_proj", "model.layers.89.mlp.experts.120.down_proj", "model.layers.89.mlp.experts.121.down_proj", "model.layers.89.mlp.experts.122.down_proj", "model.layers.89.mlp.experts.123.down_proj", "model.layers.89.mlp.experts.124.down_proj", "model.layers.89.mlp.experts.125.down_proj", "model.layers.89.mlp.experts.126.down_proj", "model.layers.89.mlp.experts.127.down_proj", "model.layers.89.mlp.experts.128.down_proj", "model.layers.89.mlp.experts.129.down_proj", "model.layers.89.mlp.experts.130.down_proj", "model.layers.89.mlp.experts.131.down_proj", "model.layers.89.mlp.experts.132.down_proj", "model.layers.89.mlp.experts.133.down_proj", "model.layers.89.mlp.experts.134.down_proj", "model.layers.89.mlp.experts.135.down_proj", "model.layers.89.mlp.experts.136.down_proj", "model.layers.89.mlp.experts.137.down_proj", "model.layers.89.mlp.experts.138.down_proj", "model.layers.89.mlp.experts.139.down_proj", "model.layers.89.mlp.experts.140.down_proj", "model.layers.89.mlp.experts.141.down_proj", "model.layers.89.mlp.experts.142.down_proj", "model.layers.89.mlp.experts.143.down_proj", "model.layers.89.mlp.experts.144.down_proj", "model.layers.89.mlp.experts.145.down_proj", "model.layers.89.mlp.experts.146.down_proj", "model.layers.89.mlp.experts.147.down_proj", "model.layers.89.mlp.experts.148.down_proj", "model.layers.89.mlp.experts.149.down_proj", "model.layers.89.mlp.experts.150.down_proj", "model.layers.89.mlp.experts.151.down_proj", "model.layers.89.mlp.experts.152.down_proj", "model.layers.89.mlp.experts.153.down_proj", "model.layers.89.mlp.experts.154.down_proj", "model.layers.89.mlp.experts.155.down_proj", "model.layers.89.mlp.experts.156.down_proj", "model.layers.89.mlp.experts.157.down_proj", "model.layers.89.mlp.experts.158.down_proj", "model.layers.89.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 4.7669745981832046e-07, "dbits": 1258291200 }, { "dkld": -8.25570896267891e-06, "dbits": 2516582400 } ] }, { "idx": 537, "layers": [ "model.layers.90.self_attn.q_proj" ], "candidates": [ { "dkld": -1.1207535862922668e-05, "dbits": 62914560 }, { "dkld": 7.048947736620903e-07, "dbits": 125829120 } ] }, { "idx": 538, "layers": [ "model.layers.90.self_attn.k_proj", "model.layers.90.self_attn.v_proj" ], "candidates": [ { "dkld": -5.2719167433677716e-05, "dbits": 10485760 }, { "dkld": -5.4322113282977494e-05, "dbits": 20971520 } ] }, { "idx": 539, "layers": [ "model.layers.90.self_attn.o_proj" ], "candidates": [ { "dkld": 8.344696834684112e-06, "dbits": 62914560 }, { "dkld": 3.758631646633842e-06, "dbits": 125829120 } ] }, { "idx": 540, "layers": [ "model.layers.90.mlp.shared_experts.gate_proj", "model.layers.90.mlp.shared_experts.up_proj", "model.layers.90.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -7.483065128326312e-05, "dbits": 23592960 }, { "dkld": -5.158535204827751e-05, "dbits": 47185920 } ] }, { "idx": 541, "layers": [ "model.layers.90.mlp.experts.0.gate_proj", "model.layers.90.mlp.experts.1.gate_proj", "model.layers.90.mlp.experts.2.gate_proj", "model.layers.90.mlp.experts.3.gate_proj", "model.layers.90.mlp.experts.4.gate_proj", "model.layers.90.mlp.experts.5.gate_proj", "model.layers.90.mlp.experts.6.gate_proj", "model.layers.90.mlp.experts.7.gate_proj", "model.layers.90.mlp.experts.8.gate_proj", "model.layers.90.mlp.experts.9.gate_proj", "model.layers.90.mlp.experts.10.gate_proj", "model.layers.90.mlp.experts.11.gate_proj", "model.layers.90.mlp.experts.12.gate_proj", "model.layers.90.mlp.experts.13.gate_proj", "model.layers.90.mlp.experts.14.gate_proj", "model.layers.90.mlp.experts.15.gate_proj", "model.layers.90.mlp.experts.16.gate_proj", "model.layers.90.mlp.experts.17.gate_proj", "model.layers.90.mlp.experts.18.gate_proj", "model.layers.90.mlp.experts.19.gate_proj", "model.layers.90.mlp.experts.20.gate_proj", "model.layers.90.mlp.experts.21.gate_proj", "model.layers.90.mlp.experts.22.gate_proj", "model.layers.90.mlp.experts.23.gate_proj", "model.layers.90.mlp.experts.24.gate_proj", "model.layers.90.mlp.experts.25.gate_proj", "model.layers.90.mlp.experts.26.gate_proj", "model.layers.90.mlp.experts.27.gate_proj", "model.layers.90.mlp.experts.28.gate_proj", "model.layers.90.mlp.experts.29.gate_proj", "model.layers.90.mlp.experts.30.gate_proj", "model.layers.90.mlp.experts.31.gate_proj", "model.layers.90.mlp.experts.32.gate_proj", "model.layers.90.mlp.experts.33.gate_proj", "model.layers.90.mlp.experts.34.gate_proj", "model.layers.90.mlp.experts.35.gate_proj", "model.layers.90.mlp.experts.36.gate_proj", "model.layers.90.mlp.experts.37.gate_proj", "model.layers.90.mlp.experts.38.gate_proj", "model.layers.90.mlp.experts.39.gate_proj", "model.layers.90.mlp.experts.40.gate_proj", "model.layers.90.mlp.experts.41.gate_proj", "model.layers.90.mlp.experts.42.gate_proj", "model.layers.90.mlp.experts.43.gate_proj", "model.layers.90.mlp.experts.44.gate_proj", "model.layers.90.mlp.experts.45.gate_proj", "model.layers.90.mlp.experts.46.gate_proj", "model.layers.90.mlp.experts.47.gate_proj", "model.layers.90.mlp.experts.48.gate_proj", "model.layers.90.mlp.experts.49.gate_proj", "model.layers.90.mlp.experts.50.gate_proj", "model.layers.90.mlp.experts.51.gate_proj", "model.layers.90.mlp.experts.52.gate_proj", "model.layers.90.mlp.experts.53.gate_proj", "model.layers.90.mlp.experts.54.gate_proj", "model.layers.90.mlp.experts.55.gate_proj", "model.layers.90.mlp.experts.56.gate_proj", "model.layers.90.mlp.experts.57.gate_proj", "model.layers.90.mlp.experts.58.gate_proj", "model.layers.90.mlp.experts.59.gate_proj", "model.layers.90.mlp.experts.60.gate_proj", "model.layers.90.mlp.experts.61.gate_proj", "model.layers.90.mlp.experts.62.gate_proj", "model.layers.90.mlp.experts.63.gate_proj", "model.layers.90.mlp.experts.64.gate_proj", "model.layers.90.mlp.experts.65.gate_proj", "model.layers.90.mlp.experts.66.gate_proj", "model.layers.90.mlp.experts.67.gate_proj", "model.layers.90.mlp.experts.68.gate_proj", "model.layers.90.mlp.experts.69.gate_proj", "model.layers.90.mlp.experts.70.gate_proj", "model.layers.90.mlp.experts.71.gate_proj", "model.layers.90.mlp.experts.72.gate_proj", "model.layers.90.mlp.experts.73.gate_proj", "model.layers.90.mlp.experts.74.gate_proj", "model.layers.90.mlp.experts.75.gate_proj", "model.layers.90.mlp.experts.76.gate_proj", "model.layers.90.mlp.experts.77.gate_proj", "model.layers.90.mlp.experts.78.gate_proj", "model.layers.90.mlp.experts.79.gate_proj", "model.layers.90.mlp.experts.80.gate_proj", "model.layers.90.mlp.experts.81.gate_proj", "model.layers.90.mlp.experts.82.gate_proj", "model.layers.90.mlp.experts.83.gate_proj", "model.layers.90.mlp.experts.84.gate_proj", "model.layers.90.mlp.experts.85.gate_proj", "model.layers.90.mlp.experts.86.gate_proj", "model.layers.90.mlp.experts.87.gate_proj", "model.layers.90.mlp.experts.88.gate_proj", "model.layers.90.mlp.experts.89.gate_proj", "model.layers.90.mlp.experts.90.gate_proj", "model.layers.90.mlp.experts.91.gate_proj", "model.layers.90.mlp.experts.92.gate_proj", "model.layers.90.mlp.experts.93.gate_proj", "model.layers.90.mlp.experts.94.gate_proj", "model.layers.90.mlp.experts.95.gate_proj", "model.layers.90.mlp.experts.96.gate_proj", "model.layers.90.mlp.experts.97.gate_proj", "model.layers.90.mlp.experts.98.gate_proj", "model.layers.90.mlp.experts.99.gate_proj", "model.layers.90.mlp.experts.100.gate_proj", "model.layers.90.mlp.experts.101.gate_proj", "model.layers.90.mlp.experts.102.gate_proj", "model.layers.90.mlp.experts.103.gate_proj", "model.layers.90.mlp.experts.104.gate_proj", "model.layers.90.mlp.experts.105.gate_proj", "model.layers.90.mlp.experts.106.gate_proj", "model.layers.90.mlp.experts.107.gate_proj", "model.layers.90.mlp.experts.108.gate_proj", "model.layers.90.mlp.experts.109.gate_proj", "model.layers.90.mlp.experts.110.gate_proj", "model.layers.90.mlp.experts.111.gate_proj", "model.layers.90.mlp.experts.112.gate_proj", "model.layers.90.mlp.experts.113.gate_proj", "model.layers.90.mlp.experts.114.gate_proj", "model.layers.90.mlp.experts.115.gate_proj", "model.layers.90.mlp.experts.116.gate_proj", "model.layers.90.mlp.experts.117.gate_proj", "model.layers.90.mlp.experts.118.gate_proj", "model.layers.90.mlp.experts.119.gate_proj", "model.layers.90.mlp.experts.120.gate_proj", "model.layers.90.mlp.experts.121.gate_proj", "model.layers.90.mlp.experts.122.gate_proj", "model.layers.90.mlp.experts.123.gate_proj", "model.layers.90.mlp.experts.124.gate_proj", "model.layers.90.mlp.experts.125.gate_proj", "model.layers.90.mlp.experts.126.gate_proj", "model.layers.90.mlp.experts.127.gate_proj", "model.layers.90.mlp.experts.128.gate_proj", "model.layers.90.mlp.experts.129.gate_proj", "model.layers.90.mlp.experts.130.gate_proj", "model.layers.90.mlp.experts.131.gate_proj", "model.layers.90.mlp.experts.132.gate_proj", "model.layers.90.mlp.experts.133.gate_proj", "model.layers.90.mlp.experts.134.gate_proj", "model.layers.90.mlp.experts.135.gate_proj", "model.layers.90.mlp.experts.136.gate_proj", "model.layers.90.mlp.experts.137.gate_proj", "model.layers.90.mlp.experts.138.gate_proj", "model.layers.90.mlp.experts.139.gate_proj", "model.layers.90.mlp.experts.140.gate_proj", "model.layers.90.mlp.experts.141.gate_proj", "model.layers.90.mlp.experts.142.gate_proj", "model.layers.90.mlp.experts.143.gate_proj", "model.layers.90.mlp.experts.144.gate_proj", "model.layers.90.mlp.experts.145.gate_proj", "model.layers.90.mlp.experts.146.gate_proj", "model.layers.90.mlp.experts.147.gate_proj", "model.layers.90.mlp.experts.148.gate_proj", "model.layers.90.mlp.experts.149.gate_proj", "model.layers.90.mlp.experts.150.gate_proj", "model.layers.90.mlp.experts.151.gate_proj", "model.layers.90.mlp.experts.152.gate_proj", "model.layers.90.mlp.experts.153.gate_proj", "model.layers.90.mlp.experts.154.gate_proj", "model.layers.90.mlp.experts.155.gate_proj", "model.layers.90.mlp.experts.156.gate_proj", "model.layers.90.mlp.experts.157.gate_proj", "model.layers.90.mlp.experts.158.gate_proj", "model.layers.90.mlp.experts.159.gate_proj", "model.layers.90.mlp.experts.0.up_proj", "model.layers.90.mlp.experts.1.up_proj", "model.layers.90.mlp.experts.2.up_proj", "model.layers.90.mlp.experts.3.up_proj", "model.layers.90.mlp.experts.4.up_proj", "model.layers.90.mlp.experts.5.up_proj", "model.layers.90.mlp.experts.6.up_proj", "model.layers.90.mlp.experts.7.up_proj", "model.layers.90.mlp.experts.8.up_proj", "model.layers.90.mlp.experts.9.up_proj", "model.layers.90.mlp.experts.10.up_proj", "model.layers.90.mlp.experts.11.up_proj", "model.layers.90.mlp.experts.12.up_proj", "model.layers.90.mlp.experts.13.up_proj", "model.layers.90.mlp.experts.14.up_proj", "model.layers.90.mlp.experts.15.up_proj", "model.layers.90.mlp.experts.16.up_proj", "model.layers.90.mlp.experts.17.up_proj", "model.layers.90.mlp.experts.18.up_proj", "model.layers.90.mlp.experts.19.up_proj", "model.layers.90.mlp.experts.20.up_proj", "model.layers.90.mlp.experts.21.up_proj", "model.layers.90.mlp.experts.22.up_proj", "model.layers.90.mlp.experts.23.up_proj", "model.layers.90.mlp.experts.24.up_proj", "model.layers.90.mlp.experts.25.up_proj", "model.layers.90.mlp.experts.26.up_proj", "model.layers.90.mlp.experts.27.up_proj", "model.layers.90.mlp.experts.28.up_proj", "model.layers.90.mlp.experts.29.up_proj", "model.layers.90.mlp.experts.30.up_proj", "model.layers.90.mlp.experts.31.up_proj", "model.layers.90.mlp.experts.32.up_proj", "model.layers.90.mlp.experts.33.up_proj", "model.layers.90.mlp.experts.34.up_proj", "model.layers.90.mlp.experts.35.up_proj", "model.layers.90.mlp.experts.36.up_proj", "model.layers.90.mlp.experts.37.up_proj", "model.layers.90.mlp.experts.38.up_proj", "model.layers.90.mlp.experts.39.up_proj", "model.layers.90.mlp.experts.40.up_proj", "model.layers.90.mlp.experts.41.up_proj", "model.layers.90.mlp.experts.42.up_proj", "model.layers.90.mlp.experts.43.up_proj", "model.layers.90.mlp.experts.44.up_proj", "model.layers.90.mlp.experts.45.up_proj", "model.layers.90.mlp.experts.46.up_proj", "model.layers.90.mlp.experts.47.up_proj", "model.layers.90.mlp.experts.48.up_proj", "model.layers.90.mlp.experts.49.up_proj", "model.layers.90.mlp.experts.50.up_proj", "model.layers.90.mlp.experts.51.up_proj", "model.layers.90.mlp.experts.52.up_proj", "model.layers.90.mlp.experts.53.up_proj", "model.layers.90.mlp.experts.54.up_proj", "model.layers.90.mlp.experts.55.up_proj", "model.layers.90.mlp.experts.56.up_proj", "model.layers.90.mlp.experts.57.up_proj", "model.layers.90.mlp.experts.58.up_proj", "model.layers.90.mlp.experts.59.up_proj", "model.layers.90.mlp.experts.60.up_proj", "model.layers.90.mlp.experts.61.up_proj", "model.layers.90.mlp.experts.62.up_proj", "model.layers.90.mlp.experts.63.up_proj", "model.layers.90.mlp.experts.64.up_proj", "model.layers.90.mlp.experts.65.up_proj", "model.layers.90.mlp.experts.66.up_proj", "model.layers.90.mlp.experts.67.up_proj", "model.layers.90.mlp.experts.68.up_proj", "model.layers.90.mlp.experts.69.up_proj", "model.layers.90.mlp.experts.70.up_proj", "model.layers.90.mlp.experts.71.up_proj", "model.layers.90.mlp.experts.72.up_proj", "model.layers.90.mlp.experts.73.up_proj", "model.layers.90.mlp.experts.74.up_proj", "model.layers.90.mlp.experts.75.up_proj", "model.layers.90.mlp.experts.76.up_proj", "model.layers.90.mlp.experts.77.up_proj", "model.layers.90.mlp.experts.78.up_proj", "model.layers.90.mlp.experts.79.up_proj", "model.layers.90.mlp.experts.80.up_proj", "model.layers.90.mlp.experts.81.up_proj", "model.layers.90.mlp.experts.82.up_proj", "model.layers.90.mlp.experts.83.up_proj", "model.layers.90.mlp.experts.84.up_proj", "model.layers.90.mlp.experts.85.up_proj", "model.layers.90.mlp.experts.86.up_proj", "model.layers.90.mlp.experts.87.up_proj", "model.layers.90.mlp.experts.88.up_proj", "model.layers.90.mlp.experts.89.up_proj", "model.layers.90.mlp.experts.90.up_proj", "model.layers.90.mlp.experts.91.up_proj", "model.layers.90.mlp.experts.92.up_proj", "model.layers.90.mlp.experts.93.up_proj", "model.layers.90.mlp.experts.94.up_proj", "model.layers.90.mlp.experts.95.up_proj", "model.layers.90.mlp.experts.96.up_proj", "model.layers.90.mlp.experts.97.up_proj", "model.layers.90.mlp.experts.98.up_proj", "model.layers.90.mlp.experts.99.up_proj", "model.layers.90.mlp.experts.100.up_proj", "model.layers.90.mlp.experts.101.up_proj", "model.layers.90.mlp.experts.102.up_proj", "model.layers.90.mlp.experts.103.up_proj", "model.layers.90.mlp.experts.104.up_proj", "model.layers.90.mlp.experts.105.up_proj", "model.layers.90.mlp.experts.106.up_proj", "model.layers.90.mlp.experts.107.up_proj", "model.layers.90.mlp.experts.108.up_proj", "model.layers.90.mlp.experts.109.up_proj", "model.layers.90.mlp.experts.110.up_proj", "model.layers.90.mlp.experts.111.up_proj", "model.layers.90.mlp.experts.112.up_proj", "model.layers.90.mlp.experts.113.up_proj", "model.layers.90.mlp.experts.114.up_proj", "model.layers.90.mlp.experts.115.up_proj", "model.layers.90.mlp.experts.116.up_proj", "model.layers.90.mlp.experts.117.up_proj", "model.layers.90.mlp.experts.118.up_proj", "model.layers.90.mlp.experts.119.up_proj", "model.layers.90.mlp.experts.120.up_proj", "model.layers.90.mlp.experts.121.up_proj", "model.layers.90.mlp.experts.122.up_proj", "model.layers.90.mlp.experts.123.up_proj", "model.layers.90.mlp.experts.124.up_proj", "model.layers.90.mlp.experts.125.up_proj", "model.layers.90.mlp.experts.126.up_proj", "model.layers.90.mlp.experts.127.up_proj", "model.layers.90.mlp.experts.128.up_proj", "model.layers.90.mlp.experts.129.up_proj", "model.layers.90.mlp.experts.130.up_proj", "model.layers.90.mlp.experts.131.up_proj", "model.layers.90.mlp.experts.132.up_proj", "model.layers.90.mlp.experts.133.up_proj", "model.layers.90.mlp.experts.134.up_proj", "model.layers.90.mlp.experts.135.up_proj", "model.layers.90.mlp.experts.136.up_proj", "model.layers.90.mlp.experts.137.up_proj", "model.layers.90.mlp.experts.138.up_proj", "model.layers.90.mlp.experts.139.up_proj", "model.layers.90.mlp.experts.140.up_proj", "model.layers.90.mlp.experts.141.up_proj", "model.layers.90.mlp.experts.142.up_proj", "model.layers.90.mlp.experts.143.up_proj", "model.layers.90.mlp.experts.144.up_proj", "model.layers.90.mlp.experts.145.up_proj", "model.layers.90.mlp.experts.146.up_proj", "model.layers.90.mlp.experts.147.up_proj", "model.layers.90.mlp.experts.148.up_proj", "model.layers.90.mlp.experts.149.up_proj", "model.layers.90.mlp.experts.150.up_proj", "model.layers.90.mlp.experts.151.up_proj", "model.layers.90.mlp.experts.152.up_proj", "model.layers.90.mlp.experts.153.up_proj", "model.layers.90.mlp.experts.154.up_proj", "model.layers.90.mlp.experts.155.up_proj", "model.layers.90.mlp.experts.156.up_proj", "model.layers.90.mlp.experts.157.up_proj", "model.layers.90.mlp.experts.158.up_proj", "model.layers.90.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": -1.8742866814136505e-08, "dbits": 2516582400 }, { "dkld": -4.607392475007577e-06, "dbits": 5033164800 } ] }, { "idx": 542, "layers": [ "model.layers.90.mlp.experts.0.down_proj", "model.layers.90.mlp.experts.1.down_proj", "model.layers.90.mlp.experts.2.down_proj", "model.layers.90.mlp.experts.3.down_proj", "model.layers.90.mlp.experts.4.down_proj", "model.layers.90.mlp.experts.5.down_proj", "model.layers.90.mlp.experts.6.down_proj", "model.layers.90.mlp.experts.7.down_proj", "model.layers.90.mlp.experts.8.down_proj", "model.layers.90.mlp.experts.9.down_proj", "model.layers.90.mlp.experts.10.down_proj", "model.layers.90.mlp.experts.11.down_proj", "model.layers.90.mlp.experts.12.down_proj", "model.layers.90.mlp.experts.13.down_proj", "model.layers.90.mlp.experts.14.down_proj", "model.layers.90.mlp.experts.15.down_proj", "model.layers.90.mlp.experts.16.down_proj", "model.layers.90.mlp.experts.17.down_proj", "model.layers.90.mlp.experts.18.down_proj", "model.layers.90.mlp.experts.19.down_proj", "model.layers.90.mlp.experts.20.down_proj", "model.layers.90.mlp.experts.21.down_proj", "model.layers.90.mlp.experts.22.down_proj", "model.layers.90.mlp.experts.23.down_proj", "model.layers.90.mlp.experts.24.down_proj", "model.layers.90.mlp.experts.25.down_proj", "model.layers.90.mlp.experts.26.down_proj", "model.layers.90.mlp.experts.27.down_proj", "model.layers.90.mlp.experts.28.down_proj", "model.layers.90.mlp.experts.29.down_proj", "model.layers.90.mlp.experts.30.down_proj", "model.layers.90.mlp.experts.31.down_proj", "model.layers.90.mlp.experts.32.down_proj", "model.layers.90.mlp.experts.33.down_proj", "model.layers.90.mlp.experts.34.down_proj", "model.layers.90.mlp.experts.35.down_proj", "model.layers.90.mlp.experts.36.down_proj", "model.layers.90.mlp.experts.37.down_proj", "model.layers.90.mlp.experts.38.down_proj", "model.layers.90.mlp.experts.39.down_proj", "model.layers.90.mlp.experts.40.down_proj", "model.layers.90.mlp.experts.41.down_proj", "model.layers.90.mlp.experts.42.down_proj", "model.layers.90.mlp.experts.43.down_proj", "model.layers.90.mlp.experts.44.down_proj", "model.layers.90.mlp.experts.45.down_proj", "model.layers.90.mlp.experts.46.down_proj", "model.layers.90.mlp.experts.47.down_proj", "model.layers.90.mlp.experts.48.down_proj", "model.layers.90.mlp.experts.49.down_proj", "model.layers.90.mlp.experts.50.down_proj", "model.layers.90.mlp.experts.51.down_proj", "model.layers.90.mlp.experts.52.down_proj", "model.layers.90.mlp.experts.53.down_proj", "model.layers.90.mlp.experts.54.down_proj", "model.layers.90.mlp.experts.55.down_proj", "model.layers.90.mlp.experts.56.down_proj", "model.layers.90.mlp.experts.57.down_proj", "model.layers.90.mlp.experts.58.down_proj", "model.layers.90.mlp.experts.59.down_proj", "model.layers.90.mlp.experts.60.down_proj", "model.layers.90.mlp.experts.61.down_proj", "model.layers.90.mlp.experts.62.down_proj", "model.layers.90.mlp.experts.63.down_proj", "model.layers.90.mlp.experts.64.down_proj", "model.layers.90.mlp.experts.65.down_proj", "model.layers.90.mlp.experts.66.down_proj", "model.layers.90.mlp.experts.67.down_proj", "model.layers.90.mlp.experts.68.down_proj", "model.layers.90.mlp.experts.69.down_proj", "model.layers.90.mlp.experts.70.down_proj", "model.layers.90.mlp.experts.71.down_proj", "model.layers.90.mlp.experts.72.down_proj", "model.layers.90.mlp.experts.73.down_proj", "model.layers.90.mlp.experts.74.down_proj", "model.layers.90.mlp.experts.75.down_proj", "model.layers.90.mlp.experts.76.down_proj", "model.layers.90.mlp.experts.77.down_proj", "model.layers.90.mlp.experts.78.down_proj", "model.layers.90.mlp.experts.79.down_proj", "model.layers.90.mlp.experts.80.down_proj", "model.layers.90.mlp.experts.81.down_proj", "model.layers.90.mlp.experts.82.down_proj", "model.layers.90.mlp.experts.83.down_proj", "model.layers.90.mlp.experts.84.down_proj", "model.layers.90.mlp.experts.85.down_proj", "model.layers.90.mlp.experts.86.down_proj", "model.layers.90.mlp.experts.87.down_proj", "model.layers.90.mlp.experts.88.down_proj", "model.layers.90.mlp.experts.89.down_proj", "model.layers.90.mlp.experts.90.down_proj", "model.layers.90.mlp.experts.91.down_proj", "model.layers.90.mlp.experts.92.down_proj", "model.layers.90.mlp.experts.93.down_proj", "model.layers.90.mlp.experts.94.down_proj", "model.layers.90.mlp.experts.95.down_proj", "model.layers.90.mlp.experts.96.down_proj", "model.layers.90.mlp.experts.97.down_proj", "model.layers.90.mlp.experts.98.down_proj", "model.layers.90.mlp.experts.99.down_proj", "model.layers.90.mlp.experts.100.down_proj", "model.layers.90.mlp.experts.101.down_proj", "model.layers.90.mlp.experts.102.down_proj", "model.layers.90.mlp.experts.103.down_proj", "model.layers.90.mlp.experts.104.down_proj", "model.layers.90.mlp.experts.105.down_proj", "model.layers.90.mlp.experts.106.down_proj", "model.layers.90.mlp.experts.107.down_proj", "model.layers.90.mlp.experts.108.down_proj", "model.layers.90.mlp.experts.109.down_proj", "model.layers.90.mlp.experts.110.down_proj", "model.layers.90.mlp.experts.111.down_proj", "model.layers.90.mlp.experts.112.down_proj", "model.layers.90.mlp.experts.113.down_proj", "model.layers.90.mlp.experts.114.down_proj", "model.layers.90.mlp.experts.115.down_proj", "model.layers.90.mlp.experts.116.down_proj", "model.layers.90.mlp.experts.117.down_proj", "model.layers.90.mlp.experts.118.down_proj", "model.layers.90.mlp.experts.119.down_proj", "model.layers.90.mlp.experts.120.down_proj", "model.layers.90.mlp.experts.121.down_proj", "model.layers.90.mlp.experts.122.down_proj", "model.layers.90.mlp.experts.123.down_proj", "model.layers.90.mlp.experts.124.down_proj", "model.layers.90.mlp.experts.125.down_proj", "model.layers.90.mlp.experts.126.down_proj", "model.layers.90.mlp.experts.127.down_proj", "model.layers.90.mlp.experts.128.down_proj", "model.layers.90.mlp.experts.129.down_proj", "model.layers.90.mlp.experts.130.down_proj", "model.layers.90.mlp.experts.131.down_proj", "model.layers.90.mlp.experts.132.down_proj", "model.layers.90.mlp.experts.133.down_proj", "model.layers.90.mlp.experts.134.down_proj", "model.layers.90.mlp.experts.135.down_proj", "model.layers.90.mlp.experts.136.down_proj", "model.layers.90.mlp.experts.137.down_proj", "model.layers.90.mlp.experts.138.down_proj", "model.layers.90.mlp.experts.139.down_proj", "model.layers.90.mlp.experts.140.down_proj", "model.layers.90.mlp.experts.141.down_proj", "model.layers.90.mlp.experts.142.down_proj", "model.layers.90.mlp.experts.143.down_proj", "model.layers.90.mlp.experts.144.down_proj", "model.layers.90.mlp.experts.145.down_proj", "model.layers.90.mlp.experts.146.down_proj", "model.layers.90.mlp.experts.147.down_proj", "model.layers.90.mlp.experts.148.down_proj", "model.layers.90.mlp.experts.149.down_proj", "model.layers.90.mlp.experts.150.down_proj", "model.layers.90.mlp.experts.151.down_proj", "model.layers.90.mlp.experts.152.down_proj", "model.layers.90.mlp.experts.153.down_proj", "model.layers.90.mlp.experts.154.down_proj", "model.layers.90.mlp.experts.155.down_proj", "model.layers.90.mlp.experts.156.down_proj", "model.layers.90.mlp.experts.157.down_proj", "model.layers.90.mlp.experts.158.down_proj", "model.layers.90.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 8.152332156896591e-06, "dbits": 1258291200 }, { "dkld": 1.6702804714451708e-06, "dbits": 2516582400 } ] }, { "idx": 543, "layers": [ "model.layers.91.self_attn.q_proj" ], "candidates": [ { "dkld": 2.7457159012556423e-05, "dbits": 62914560 }, { "dkld": 2.9228371568025546e-05, "dbits": 125829120 } ] }, { "idx": 544, "layers": [ "model.layers.91.self_attn.k_proj", "model.layers.91.self_attn.v_proj" ], "candidates": [ { "dkld": -0.00011240593157708575, "dbits": 10485760 }, { "dkld": -0.000131230708211659, "dbits": 20971520 } ] }, { "idx": 545, "layers": [ "model.layers.91.self_attn.o_proj" ], "candidates": [ { "dkld": -7.728366181254318e-05, "dbits": 62914560 }, { "dkld": -8.071868214756112e-05, "dbits": 125829120 } ] }, { "idx": 546, "layers": [ "model.layers.91.mlp.shared_experts.gate_proj", "model.layers.91.mlp.shared_experts.up_proj", "model.layers.91.mlp.shared_experts.down_proj" ], "candidates": [ { "dkld": -0.00019697777461260418, "dbits": 23592960 }, { "dkld": -0.00016054967418312888, "dbits": 47185920 } ] }, { "idx": 547, "layers": [ "model.layers.91.mlp.experts.0.gate_proj", "model.layers.91.mlp.experts.1.gate_proj", "model.layers.91.mlp.experts.2.gate_proj", "model.layers.91.mlp.experts.3.gate_proj", "model.layers.91.mlp.experts.4.gate_proj", "model.layers.91.mlp.experts.5.gate_proj", "model.layers.91.mlp.experts.6.gate_proj", "model.layers.91.mlp.experts.7.gate_proj", "model.layers.91.mlp.experts.8.gate_proj", "model.layers.91.mlp.experts.9.gate_proj", "model.layers.91.mlp.experts.10.gate_proj", "model.layers.91.mlp.experts.11.gate_proj", "model.layers.91.mlp.experts.12.gate_proj", "model.layers.91.mlp.experts.13.gate_proj", "model.layers.91.mlp.experts.14.gate_proj", "model.layers.91.mlp.experts.15.gate_proj", "model.layers.91.mlp.experts.16.gate_proj", "model.layers.91.mlp.experts.17.gate_proj", "model.layers.91.mlp.experts.18.gate_proj", "model.layers.91.mlp.experts.19.gate_proj", "model.layers.91.mlp.experts.20.gate_proj", "model.layers.91.mlp.experts.21.gate_proj", "model.layers.91.mlp.experts.22.gate_proj", "model.layers.91.mlp.experts.23.gate_proj", "model.layers.91.mlp.experts.24.gate_proj", "model.layers.91.mlp.experts.25.gate_proj", "model.layers.91.mlp.experts.26.gate_proj", "model.layers.91.mlp.experts.27.gate_proj", "model.layers.91.mlp.experts.28.gate_proj", "model.layers.91.mlp.experts.29.gate_proj", "model.layers.91.mlp.experts.30.gate_proj", "model.layers.91.mlp.experts.31.gate_proj", "model.layers.91.mlp.experts.32.gate_proj", "model.layers.91.mlp.experts.33.gate_proj", "model.layers.91.mlp.experts.34.gate_proj", "model.layers.91.mlp.experts.35.gate_proj", "model.layers.91.mlp.experts.36.gate_proj", "model.layers.91.mlp.experts.37.gate_proj", "model.layers.91.mlp.experts.38.gate_proj", "model.layers.91.mlp.experts.39.gate_proj", "model.layers.91.mlp.experts.40.gate_proj", "model.layers.91.mlp.experts.41.gate_proj", "model.layers.91.mlp.experts.42.gate_proj", "model.layers.91.mlp.experts.43.gate_proj", "model.layers.91.mlp.experts.44.gate_proj", "model.layers.91.mlp.experts.45.gate_proj", "model.layers.91.mlp.experts.46.gate_proj", "model.layers.91.mlp.experts.47.gate_proj", "model.layers.91.mlp.experts.48.gate_proj", "model.layers.91.mlp.experts.49.gate_proj", "model.layers.91.mlp.experts.50.gate_proj", "model.layers.91.mlp.experts.51.gate_proj", "model.layers.91.mlp.experts.52.gate_proj", "model.layers.91.mlp.experts.53.gate_proj", "model.layers.91.mlp.experts.54.gate_proj", "model.layers.91.mlp.experts.55.gate_proj", "model.layers.91.mlp.experts.56.gate_proj", "model.layers.91.mlp.experts.57.gate_proj", "model.layers.91.mlp.experts.58.gate_proj", "model.layers.91.mlp.experts.59.gate_proj", "model.layers.91.mlp.experts.60.gate_proj", "model.layers.91.mlp.experts.61.gate_proj", "model.layers.91.mlp.experts.62.gate_proj", "model.layers.91.mlp.experts.63.gate_proj", "model.layers.91.mlp.experts.64.gate_proj", "model.layers.91.mlp.experts.65.gate_proj", "model.layers.91.mlp.experts.66.gate_proj", "model.layers.91.mlp.experts.67.gate_proj", "model.layers.91.mlp.experts.68.gate_proj", "model.layers.91.mlp.experts.69.gate_proj", "model.layers.91.mlp.experts.70.gate_proj", "model.layers.91.mlp.experts.71.gate_proj", "model.layers.91.mlp.experts.72.gate_proj", "model.layers.91.mlp.experts.73.gate_proj", "model.layers.91.mlp.experts.74.gate_proj", "model.layers.91.mlp.experts.75.gate_proj", "model.layers.91.mlp.experts.76.gate_proj", "model.layers.91.mlp.experts.77.gate_proj", "model.layers.91.mlp.experts.78.gate_proj", "model.layers.91.mlp.experts.79.gate_proj", "model.layers.91.mlp.experts.80.gate_proj", "model.layers.91.mlp.experts.81.gate_proj", "model.layers.91.mlp.experts.82.gate_proj", "model.layers.91.mlp.experts.83.gate_proj", "model.layers.91.mlp.experts.84.gate_proj", "model.layers.91.mlp.experts.85.gate_proj", "model.layers.91.mlp.experts.86.gate_proj", "model.layers.91.mlp.experts.87.gate_proj", "model.layers.91.mlp.experts.88.gate_proj", "model.layers.91.mlp.experts.89.gate_proj", "model.layers.91.mlp.experts.90.gate_proj", "model.layers.91.mlp.experts.91.gate_proj", "model.layers.91.mlp.experts.92.gate_proj", "model.layers.91.mlp.experts.93.gate_proj", "model.layers.91.mlp.experts.94.gate_proj", "model.layers.91.mlp.experts.95.gate_proj", "model.layers.91.mlp.experts.96.gate_proj", "model.layers.91.mlp.experts.97.gate_proj", "model.layers.91.mlp.experts.98.gate_proj", "model.layers.91.mlp.experts.99.gate_proj", "model.layers.91.mlp.experts.100.gate_proj", "model.layers.91.mlp.experts.101.gate_proj", "model.layers.91.mlp.experts.102.gate_proj", "model.layers.91.mlp.experts.103.gate_proj", "model.layers.91.mlp.experts.104.gate_proj", "model.layers.91.mlp.experts.105.gate_proj", "model.layers.91.mlp.experts.106.gate_proj", "model.layers.91.mlp.experts.107.gate_proj", "model.layers.91.mlp.experts.108.gate_proj", "model.layers.91.mlp.experts.109.gate_proj", "model.layers.91.mlp.experts.110.gate_proj", "model.layers.91.mlp.experts.111.gate_proj", "model.layers.91.mlp.experts.112.gate_proj", "model.layers.91.mlp.experts.113.gate_proj", "model.layers.91.mlp.experts.114.gate_proj", "model.layers.91.mlp.experts.115.gate_proj", "model.layers.91.mlp.experts.116.gate_proj", "model.layers.91.mlp.experts.117.gate_proj", "model.layers.91.mlp.experts.118.gate_proj", "model.layers.91.mlp.experts.119.gate_proj", "model.layers.91.mlp.experts.120.gate_proj", "model.layers.91.mlp.experts.121.gate_proj", "model.layers.91.mlp.experts.122.gate_proj", "model.layers.91.mlp.experts.123.gate_proj", "model.layers.91.mlp.experts.124.gate_proj", "model.layers.91.mlp.experts.125.gate_proj", "model.layers.91.mlp.experts.126.gate_proj", "model.layers.91.mlp.experts.127.gate_proj", "model.layers.91.mlp.experts.128.gate_proj", "model.layers.91.mlp.experts.129.gate_proj", "model.layers.91.mlp.experts.130.gate_proj", "model.layers.91.mlp.experts.131.gate_proj", "model.layers.91.mlp.experts.132.gate_proj", "model.layers.91.mlp.experts.133.gate_proj", "model.layers.91.mlp.experts.134.gate_proj", "model.layers.91.mlp.experts.135.gate_proj", "model.layers.91.mlp.experts.136.gate_proj", "model.layers.91.mlp.experts.137.gate_proj", "model.layers.91.mlp.experts.138.gate_proj", "model.layers.91.mlp.experts.139.gate_proj", "model.layers.91.mlp.experts.140.gate_proj", "model.layers.91.mlp.experts.141.gate_proj", "model.layers.91.mlp.experts.142.gate_proj", "model.layers.91.mlp.experts.143.gate_proj", "model.layers.91.mlp.experts.144.gate_proj", "model.layers.91.mlp.experts.145.gate_proj", "model.layers.91.mlp.experts.146.gate_proj", "model.layers.91.mlp.experts.147.gate_proj", "model.layers.91.mlp.experts.148.gate_proj", "model.layers.91.mlp.experts.149.gate_proj", "model.layers.91.mlp.experts.150.gate_proj", "model.layers.91.mlp.experts.151.gate_proj", "model.layers.91.mlp.experts.152.gate_proj", "model.layers.91.mlp.experts.153.gate_proj", "model.layers.91.mlp.experts.154.gate_proj", "model.layers.91.mlp.experts.155.gate_proj", "model.layers.91.mlp.experts.156.gate_proj", "model.layers.91.mlp.experts.157.gate_proj", "model.layers.91.mlp.experts.158.gate_proj", "model.layers.91.mlp.experts.159.gate_proj", "model.layers.91.mlp.experts.0.up_proj", "model.layers.91.mlp.experts.1.up_proj", "model.layers.91.mlp.experts.2.up_proj", "model.layers.91.mlp.experts.3.up_proj", "model.layers.91.mlp.experts.4.up_proj", "model.layers.91.mlp.experts.5.up_proj", "model.layers.91.mlp.experts.6.up_proj", "model.layers.91.mlp.experts.7.up_proj", "model.layers.91.mlp.experts.8.up_proj", "model.layers.91.mlp.experts.9.up_proj", "model.layers.91.mlp.experts.10.up_proj", "model.layers.91.mlp.experts.11.up_proj", "model.layers.91.mlp.experts.12.up_proj", "model.layers.91.mlp.experts.13.up_proj", "model.layers.91.mlp.experts.14.up_proj", "model.layers.91.mlp.experts.15.up_proj", "model.layers.91.mlp.experts.16.up_proj", "model.layers.91.mlp.experts.17.up_proj", "model.layers.91.mlp.experts.18.up_proj", "model.layers.91.mlp.experts.19.up_proj", "model.layers.91.mlp.experts.20.up_proj", "model.layers.91.mlp.experts.21.up_proj", "model.layers.91.mlp.experts.22.up_proj", "model.layers.91.mlp.experts.23.up_proj", "model.layers.91.mlp.experts.24.up_proj", "model.layers.91.mlp.experts.25.up_proj", "model.layers.91.mlp.experts.26.up_proj", "model.layers.91.mlp.experts.27.up_proj", "model.layers.91.mlp.experts.28.up_proj", "model.layers.91.mlp.experts.29.up_proj", "model.layers.91.mlp.experts.30.up_proj", "model.layers.91.mlp.experts.31.up_proj", "model.layers.91.mlp.experts.32.up_proj", "model.layers.91.mlp.experts.33.up_proj", "model.layers.91.mlp.experts.34.up_proj", "model.layers.91.mlp.experts.35.up_proj", "model.layers.91.mlp.experts.36.up_proj", "model.layers.91.mlp.experts.37.up_proj", "model.layers.91.mlp.experts.38.up_proj", "model.layers.91.mlp.experts.39.up_proj", "model.layers.91.mlp.experts.40.up_proj", "model.layers.91.mlp.experts.41.up_proj", "model.layers.91.mlp.experts.42.up_proj", "model.layers.91.mlp.experts.43.up_proj", "model.layers.91.mlp.experts.44.up_proj", "model.layers.91.mlp.experts.45.up_proj", "model.layers.91.mlp.experts.46.up_proj", "model.layers.91.mlp.experts.47.up_proj", "model.layers.91.mlp.experts.48.up_proj", "model.layers.91.mlp.experts.49.up_proj", "model.layers.91.mlp.experts.50.up_proj", "model.layers.91.mlp.experts.51.up_proj", "model.layers.91.mlp.experts.52.up_proj", "model.layers.91.mlp.experts.53.up_proj", "model.layers.91.mlp.experts.54.up_proj", "model.layers.91.mlp.experts.55.up_proj", "model.layers.91.mlp.experts.56.up_proj", "model.layers.91.mlp.experts.57.up_proj", "model.layers.91.mlp.experts.58.up_proj", "model.layers.91.mlp.experts.59.up_proj", "model.layers.91.mlp.experts.60.up_proj", "model.layers.91.mlp.experts.61.up_proj", "model.layers.91.mlp.experts.62.up_proj", "model.layers.91.mlp.experts.63.up_proj", "model.layers.91.mlp.experts.64.up_proj", "model.layers.91.mlp.experts.65.up_proj", "model.layers.91.mlp.experts.66.up_proj", "model.layers.91.mlp.experts.67.up_proj", "model.layers.91.mlp.experts.68.up_proj", "model.layers.91.mlp.experts.69.up_proj", "model.layers.91.mlp.experts.70.up_proj", "model.layers.91.mlp.experts.71.up_proj", "model.layers.91.mlp.experts.72.up_proj", "model.layers.91.mlp.experts.73.up_proj", "model.layers.91.mlp.experts.74.up_proj", "model.layers.91.mlp.experts.75.up_proj", "model.layers.91.mlp.experts.76.up_proj", "model.layers.91.mlp.experts.77.up_proj", "model.layers.91.mlp.experts.78.up_proj", "model.layers.91.mlp.experts.79.up_proj", "model.layers.91.mlp.experts.80.up_proj", "model.layers.91.mlp.experts.81.up_proj", "model.layers.91.mlp.experts.82.up_proj", "model.layers.91.mlp.experts.83.up_proj", "model.layers.91.mlp.experts.84.up_proj", "model.layers.91.mlp.experts.85.up_proj", "model.layers.91.mlp.experts.86.up_proj", "model.layers.91.mlp.experts.87.up_proj", "model.layers.91.mlp.experts.88.up_proj", "model.layers.91.mlp.experts.89.up_proj", "model.layers.91.mlp.experts.90.up_proj", "model.layers.91.mlp.experts.91.up_proj", "model.layers.91.mlp.experts.92.up_proj", "model.layers.91.mlp.experts.93.up_proj", "model.layers.91.mlp.experts.94.up_proj", "model.layers.91.mlp.experts.95.up_proj", "model.layers.91.mlp.experts.96.up_proj", "model.layers.91.mlp.experts.97.up_proj", "model.layers.91.mlp.experts.98.up_proj", "model.layers.91.mlp.experts.99.up_proj", "model.layers.91.mlp.experts.100.up_proj", "model.layers.91.mlp.experts.101.up_proj", "model.layers.91.mlp.experts.102.up_proj", "model.layers.91.mlp.experts.103.up_proj", "model.layers.91.mlp.experts.104.up_proj", "model.layers.91.mlp.experts.105.up_proj", "model.layers.91.mlp.experts.106.up_proj", "model.layers.91.mlp.experts.107.up_proj", "model.layers.91.mlp.experts.108.up_proj", "model.layers.91.mlp.experts.109.up_proj", "model.layers.91.mlp.experts.110.up_proj", "model.layers.91.mlp.experts.111.up_proj", "model.layers.91.mlp.experts.112.up_proj", "model.layers.91.mlp.experts.113.up_proj", "model.layers.91.mlp.experts.114.up_proj", "model.layers.91.mlp.experts.115.up_proj", "model.layers.91.mlp.experts.116.up_proj", "model.layers.91.mlp.experts.117.up_proj", "model.layers.91.mlp.experts.118.up_proj", "model.layers.91.mlp.experts.119.up_proj", "model.layers.91.mlp.experts.120.up_proj", "model.layers.91.mlp.experts.121.up_proj", "model.layers.91.mlp.experts.122.up_proj", "model.layers.91.mlp.experts.123.up_proj", "model.layers.91.mlp.experts.124.up_proj", "model.layers.91.mlp.experts.125.up_proj", "model.layers.91.mlp.experts.126.up_proj", "model.layers.91.mlp.experts.127.up_proj", "model.layers.91.mlp.experts.128.up_proj", "model.layers.91.mlp.experts.129.up_proj", "model.layers.91.mlp.experts.130.up_proj", "model.layers.91.mlp.experts.131.up_proj", "model.layers.91.mlp.experts.132.up_proj", "model.layers.91.mlp.experts.133.up_proj", "model.layers.91.mlp.experts.134.up_proj", "model.layers.91.mlp.experts.135.up_proj", "model.layers.91.mlp.experts.136.up_proj", "model.layers.91.mlp.experts.137.up_proj", "model.layers.91.mlp.experts.138.up_proj", "model.layers.91.mlp.experts.139.up_proj", "model.layers.91.mlp.experts.140.up_proj", "model.layers.91.mlp.experts.141.up_proj", "model.layers.91.mlp.experts.142.up_proj", "model.layers.91.mlp.experts.143.up_proj", "model.layers.91.mlp.experts.144.up_proj", "model.layers.91.mlp.experts.145.up_proj", "model.layers.91.mlp.experts.146.up_proj", "model.layers.91.mlp.experts.147.up_proj", "model.layers.91.mlp.experts.148.up_proj", "model.layers.91.mlp.experts.149.up_proj", "model.layers.91.mlp.experts.150.up_proj", "model.layers.91.mlp.experts.151.up_proj", "model.layers.91.mlp.experts.152.up_proj", "model.layers.91.mlp.experts.153.up_proj", "model.layers.91.mlp.experts.154.up_proj", "model.layers.91.mlp.experts.155.up_proj", "model.layers.91.mlp.experts.156.up_proj", "model.layers.91.mlp.experts.157.up_proj", "model.layers.91.mlp.experts.158.up_proj", "model.layers.91.mlp.experts.159.up_proj" ], "candidates": [ { "dkld": 1.0231509804739525e-06, "dbits": 2516582400 }, { "dkld": -5.585351027547966e-06, "dbits": 5033164800 } ] }, { "idx": 548, "layers": [ "model.layers.91.mlp.experts.0.down_proj", "model.layers.91.mlp.experts.1.down_proj", "model.layers.91.mlp.experts.2.down_proj", "model.layers.91.mlp.experts.3.down_proj", "model.layers.91.mlp.experts.4.down_proj", "model.layers.91.mlp.experts.5.down_proj", "model.layers.91.mlp.experts.6.down_proj", "model.layers.91.mlp.experts.7.down_proj", "model.layers.91.mlp.experts.8.down_proj", "model.layers.91.mlp.experts.9.down_proj", "model.layers.91.mlp.experts.10.down_proj", "model.layers.91.mlp.experts.11.down_proj", "model.layers.91.mlp.experts.12.down_proj", "model.layers.91.mlp.experts.13.down_proj", "model.layers.91.mlp.experts.14.down_proj", "model.layers.91.mlp.experts.15.down_proj", "model.layers.91.mlp.experts.16.down_proj", "model.layers.91.mlp.experts.17.down_proj", "model.layers.91.mlp.experts.18.down_proj", "model.layers.91.mlp.experts.19.down_proj", "model.layers.91.mlp.experts.20.down_proj", "model.layers.91.mlp.experts.21.down_proj", "model.layers.91.mlp.experts.22.down_proj", "model.layers.91.mlp.experts.23.down_proj", "model.layers.91.mlp.experts.24.down_proj", "model.layers.91.mlp.experts.25.down_proj", "model.layers.91.mlp.experts.26.down_proj", "model.layers.91.mlp.experts.27.down_proj", "model.layers.91.mlp.experts.28.down_proj", "model.layers.91.mlp.experts.29.down_proj", "model.layers.91.mlp.experts.30.down_proj", "model.layers.91.mlp.experts.31.down_proj", "model.layers.91.mlp.experts.32.down_proj", "model.layers.91.mlp.experts.33.down_proj", "model.layers.91.mlp.experts.34.down_proj", "model.layers.91.mlp.experts.35.down_proj", "model.layers.91.mlp.experts.36.down_proj", "model.layers.91.mlp.experts.37.down_proj", "model.layers.91.mlp.experts.38.down_proj", "model.layers.91.mlp.experts.39.down_proj", "model.layers.91.mlp.experts.40.down_proj", "model.layers.91.mlp.experts.41.down_proj", "model.layers.91.mlp.experts.42.down_proj", "model.layers.91.mlp.experts.43.down_proj", "model.layers.91.mlp.experts.44.down_proj", "model.layers.91.mlp.experts.45.down_proj", "model.layers.91.mlp.experts.46.down_proj", "model.layers.91.mlp.experts.47.down_proj", "model.layers.91.mlp.experts.48.down_proj", "model.layers.91.mlp.experts.49.down_proj", "model.layers.91.mlp.experts.50.down_proj", "model.layers.91.mlp.experts.51.down_proj", "model.layers.91.mlp.experts.52.down_proj", "model.layers.91.mlp.experts.53.down_proj", "model.layers.91.mlp.experts.54.down_proj", "model.layers.91.mlp.experts.55.down_proj", "model.layers.91.mlp.experts.56.down_proj", "model.layers.91.mlp.experts.57.down_proj", "model.layers.91.mlp.experts.58.down_proj", "model.layers.91.mlp.experts.59.down_proj", "model.layers.91.mlp.experts.60.down_proj", "model.layers.91.mlp.experts.61.down_proj", "model.layers.91.mlp.experts.62.down_proj", "model.layers.91.mlp.experts.63.down_proj", "model.layers.91.mlp.experts.64.down_proj", "model.layers.91.mlp.experts.65.down_proj", "model.layers.91.mlp.experts.66.down_proj", "model.layers.91.mlp.experts.67.down_proj", "model.layers.91.mlp.experts.68.down_proj", "model.layers.91.mlp.experts.69.down_proj", "model.layers.91.mlp.experts.70.down_proj", "model.layers.91.mlp.experts.71.down_proj", "model.layers.91.mlp.experts.72.down_proj", "model.layers.91.mlp.experts.73.down_proj", "model.layers.91.mlp.experts.74.down_proj", "model.layers.91.mlp.experts.75.down_proj", "model.layers.91.mlp.experts.76.down_proj", "model.layers.91.mlp.experts.77.down_proj", "model.layers.91.mlp.experts.78.down_proj", "model.layers.91.mlp.experts.79.down_proj", "model.layers.91.mlp.experts.80.down_proj", "model.layers.91.mlp.experts.81.down_proj", "model.layers.91.mlp.experts.82.down_proj", "model.layers.91.mlp.experts.83.down_proj", "model.layers.91.mlp.experts.84.down_proj", "model.layers.91.mlp.experts.85.down_proj", "model.layers.91.mlp.experts.86.down_proj", "model.layers.91.mlp.experts.87.down_proj", "model.layers.91.mlp.experts.88.down_proj", "model.layers.91.mlp.experts.89.down_proj", "model.layers.91.mlp.experts.90.down_proj", "model.layers.91.mlp.experts.91.down_proj", "model.layers.91.mlp.experts.92.down_proj", "model.layers.91.mlp.experts.93.down_proj", "model.layers.91.mlp.experts.94.down_proj", "model.layers.91.mlp.experts.95.down_proj", "model.layers.91.mlp.experts.96.down_proj", "model.layers.91.mlp.experts.97.down_proj", "model.layers.91.mlp.experts.98.down_proj", "model.layers.91.mlp.experts.99.down_proj", "model.layers.91.mlp.experts.100.down_proj", "model.layers.91.mlp.experts.101.down_proj", "model.layers.91.mlp.experts.102.down_proj", "model.layers.91.mlp.experts.103.down_proj", "model.layers.91.mlp.experts.104.down_proj", "model.layers.91.mlp.experts.105.down_proj", "model.layers.91.mlp.experts.106.down_proj", "model.layers.91.mlp.experts.107.down_proj", "model.layers.91.mlp.experts.108.down_proj", "model.layers.91.mlp.experts.109.down_proj", "model.layers.91.mlp.experts.110.down_proj", "model.layers.91.mlp.experts.111.down_proj", "model.layers.91.mlp.experts.112.down_proj", "model.layers.91.mlp.experts.113.down_proj", "model.layers.91.mlp.experts.114.down_proj", "model.layers.91.mlp.experts.115.down_proj", "model.layers.91.mlp.experts.116.down_proj", "model.layers.91.mlp.experts.117.down_proj", "model.layers.91.mlp.experts.118.down_proj", "model.layers.91.mlp.experts.119.down_proj", "model.layers.91.mlp.experts.120.down_proj", "model.layers.91.mlp.experts.121.down_proj", "model.layers.91.mlp.experts.122.down_proj", "model.layers.91.mlp.experts.123.down_proj", "model.layers.91.mlp.experts.124.down_proj", "model.layers.91.mlp.experts.125.down_proj", "model.layers.91.mlp.experts.126.down_proj", "model.layers.91.mlp.experts.127.down_proj", "model.layers.91.mlp.experts.128.down_proj", "model.layers.91.mlp.experts.129.down_proj", "model.layers.91.mlp.experts.130.down_proj", "model.layers.91.mlp.experts.131.down_proj", "model.layers.91.mlp.experts.132.down_proj", "model.layers.91.mlp.experts.133.down_proj", "model.layers.91.mlp.experts.134.down_proj", "model.layers.91.mlp.experts.135.down_proj", "model.layers.91.mlp.experts.136.down_proj", "model.layers.91.mlp.experts.137.down_proj", "model.layers.91.mlp.experts.138.down_proj", "model.layers.91.mlp.experts.139.down_proj", "model.layers.91.mlp.experts.140.down_proj", "model.layers.91.mlp.experts.141.down_proj", "model.layers.91.mlp.experts.142.down_proj", "model.layers.91.mlp.experts.143.down_proj", "model.layers.91.mlp.experts.144.down_proj", "model.layers.91.mlp.experts.145.down_proj", "model.layers.91.mlp.experts.146.down_proj", "model.layers.91.mlp.experts.147.down_proj", "model.layers.91.mlp.experts.148.down_proj", "model.layers.91.mlp.experts.149.down_proj", "model.layers.91.mlp.experts.150.down_proj", "model.layers.91.mlp.experts.151.down_proj", "model.layers.91.mlp.experts.152.down_proj", "model.layers.91.mlp.experts.153.down_proj", "model.layers.91.mlp.experts.154.down_proj", "model.layers.91.mlp.experts.155.down_proj", "model.layers.91.mlp.experts.156.down_proj", "model.layers.91.mlp.experts.157.down_proj", "model.layers.91.mlp.experts.158.down_proj", "model.layers.91.mlp.experts.159.down_proj" ], "candidates": [ { "dkld": 1.9470462575554848e-06, "dbits": 1258291200 }, { "dkld": -5.550682544708252e-07, "dbits": 2516582400 } ] } ], "base_kld": 0.0132547739893198, "arch_string": "Glm4MoeForCausalLM" }